diff options
author | Henning Baldersheim <balder@yahoo-inc.com> | 2023-12-19 17:02:19 +0000 |
---|---|---|
committer | Henning Baldersheim <balder@yahoo-inc.com> | 2024-01-04 10:42:37 +0000 |
commit | 0f9915ebdfb2931ebb3c06ac55b537f42477256b (patch) | |
tree | a6f3a41e547c032d773ef391da22ca04bcfcacc3 /streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp | |
parent | 5f1ec31a0decec88322835705afa26cc7d35fd3e (diff) |
- Modernize code
- Unify some conversion tables.
Diffstat (limited to 'streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp')
-rw-r--r-- | streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp | 13 |
1 files changed, 0 insertions, 13 deletions
diff --git a/streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp b/streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp
index c31102ec0ab..ebdf69d0b30 100644
--- a/streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp
+++ b/streamingvisitors/src/vespa/vsm/searcher/utf8stringfieldsearcherbase.cpp
@@ -32,10 +32,8 @@ UTF8StringFieldSearcherBase::tokenize(const byte * p, size_t maxSz, cmptype_t *
                 c = *p;
             }
         } else {
-            const byte * oldP(p);
             c = Fast_UnicodeUtil::GetUTF8CharNonAscii(p);
             if (Fast_UnicodeUtil::IsWordChar(c)) {
-                _utf8Count[p-oldP-1]++;
                 const char *repl = Fast_NormalizeWordFolder::ReplacementString(c);
                 if (repl != nullptr) {
                     size_t repllen = strlen(repl);
@@ -50,8 +48,6 @@ UTF8StringFieldSearcherBase::tokenize(const byte * p, size_t maxSz, cmptype_t *
             } else {
                 if (c == Fast_UnicodeUtil::_BadUTF8Char) {
                     _badUtf8Count++;
-                } else {
-                    _utf8Count[p-oldP-1]++;
                 }
                 c = *p;
             }
@@ -70,10 +66,8 @@ UTF8StringFieldSearcherBase::tokenize(const byte * p, size_t maxSz, cmptype_t *
                 c = *p;
             }
         } else {
-            const byte * oldP(p);
             c = Fast_UnicodeUtil::GetUTF8CharNonAscii(p);
             if (__builtin_expect(Fast_UnicodeUtil::IsWordChar(c), false)) {
-                _utf8Count[p-oldP-1]++;
                 const char *repl = Fast_NormalizeWordFolder::ReplacementString(c);
                 if (repl != nullptr) {
                     size_t repllen = strlen(repl);
@@ -89,8 +83,6 @@ UTF8StringFieldSearcherBase::tokenize(const byte * p, size_t maxSz, cmptype_t *
             } else {
                 if (c == Fast_UnicodeUtil::_BadUTF8Char) {
                     _badUtf8Count++;
-                } else {
-                    _utf8Count[p-oldP-1]++;
                 }
                 break;
             }
@@ -128,7 +120,6 @@ UTF8StringFieldSearcherBase::matchTermRegular(const FieldRef & f, QueryTerm & qt
         }
         words++;
     }
-    NEED_CHAR_STAT(addAnyUtf8Field(f.size()));
     return words;
 }
 
@@ -154,7 +145,6 @@ UTF8StringFieldSearcherBase::matchTermExact(const FieldRef & f, QueryTerm & qt)
             addHit(qt,0);
         }
     }
-    NEED_CHAR_STAT(addAnyUtf8Field(f.size()));
     return 1;
 }
 
@@ -188,7 +178,6 @@ UTF8StringFieldSearcherBase::matchTermSubstring(const FieldRef & f, QueryTerm &
             }
         }
     }
-    NEED_CHAR_STAT(addAnyUtf8Field(f.size()));
     return words + 1; // we must also count the last word
 }
 
@@ -305,8 +294,6 @@ UTF8StringFieldSearcherBase::skipSeparators(const search::byte * p, size_t sz, T
                 }
                 if (c == Fast_UnicodeUtil::_BadUTF8Char) {
                     _badUtf8Count++;
-                } else {
-                    _utf8Count[p-oldP-1]++;
                 }
             }
         }