aboutsummaryrefslogtreecommitdiffstats
path: root/container-search
diff options
context:
space:
mode:
authorJon Bratseth <bratseth@vespa.ai>2023-05-22 11:47:54 +0200
committerJon Bratseth <bratseth@vespa.ai>2023-05-22 11:47:54 +0200
commit179a1d90ca76fa61bcbeb3967a58fd3e9b5e9654 (patch)
treef24eccc59c5d4f8d2caf8945ad0323c9143f5e53 /container-search
parentc7a07adf43c13165e49e2aa2ef509ecb2526a48c (diff)
Treat 'other symbols' as letters
The unicode class 'other symbols' contains emojis, math symbols, etc. Treat these as letter characters to support searching for them.
Diffstat (limited to 'container-search')
-rw-r--r--container-search/src/test/java/com/yahoo/prelude/query/parser/test/ParseTestCase.java12
1 files changed, 12 insertions, 0 deletions
diff --git a/container-search/src/test/java/com/yahoo/prelude/query/parser/test/ParseTestCase.java b/container-search/src/test/java/com/yahoo/prelude/query/parser/test/ParseTestCase.java
index 583e89bacd6..475b7beb879 100644
--- a/container-search/src/test/java/com/yahoo/prelude/query/parser/test/ParseTestCase.java
+++ b/container-search/src/test/java/com/yahoo/prelude/query/parser/test/ParseTestCase.java
@@ -2580,4 +2580,16 @@ public class ParseTestCase {
void testNoGrammar4() {
tester.assertParsed("WEAKAND(100) foo bar baz one two 37", "foo -(bar baz \"one two\" 37)", Query.Type.TOKENIZE);
}
+
+ @Test
+ void testEmojis() { // Passes emoji-only strings to assertParsed, using the same string for both string arguments.
+ String emoji1 = "\uD83D\uDD2A"; // 🔪 U+1F52A, written as a UTF-16 surrogate pair
+ tester.assertParsed(emoji1, emoji1, Query.Type.ANY); // single emoji; presumably (expected, input, type) - confirm against the tester helper
+
+ String emoji2 = "\uD83D\uDE00"; // 😀 U+1F600, written as a UTF-16 surrogate pair
+ tester.assertParsed(emoji2, emoji2, Query.Type.ANY); // same check with a second emoji
+
+ tester.assertParsed(emoji1 + emoji2, emoji1 + emoji2, Query.Type.ANY); // both emojis concatenated with no separator between them
+ }
+
}