38446.patch - Redmine

Feature #38446 » 38446.patch

Go MAEDA, 2024-04-29 04:28

           def tokens
             # extract tokens from the question
             # e.g. hello "bye bye" => ["hello", "bye bye"]
             tokens = @question.scan(%r{(([[:space:]]|^)"[^"]+"([[:space:]]|$)|[[:^space:]]+)}).collect {|m| m.first.gsub(%r{(^[[:space:]]*"[[:space:]]*|[[:space:]]*"[[:space:]]*$)}, '')}
             tokens = @question.scan(/"[^"]+"|[[:^space:]]+/).map do |token|
               # Remove quotes from quoted tokens, strip surrounding whitespace
               token.gsub(/"\s*|\s*"/, '').gsub(/^[[:space:]]+|[[:space:]]+$/, '')
             end
             # tokens must be at least 2 characters long
             # but for Chinese characters (Chinese HANZI/Japanese KANJI), tokens can be one character
             # no more than 5 tokens to search for

         value = "全角\u3000スペース"
         assert_equal %w[全角 スペース], Redmine::Search::Tokenizer.new(value).tokens
       end
       # Verifies that a query made of two separate double-quoted phrases is
       # tokenized into two tokens, one per phrase, with the quotes removed.
       def test_tokenize_should_support_multiple_phrases
         expected_tokens = ["phrase one", "phrase two"]
         tokenizer = Redmine::Search::Tokenizer.new('"phrase one" "phrase two"')

         assert_equal expected_tokens, tokenizer.tokens
       end
     end

(1-1/2)