diff options
Diffstat (limited to 'vespalib/src/vespa/vespalib/text/lowercase.cpp')
-rw-r--r-- | vespalib/src/vespa/vespalib/text/lowercase.cpp | 12 |
1 files changed, 12 insertions, 0 deletions
diff --git a/vespalib/src/vespa/vespalib/text/lowercase.cpp b/vespalib/src/vespa/vespalib/text/lowercase.cpp
index 604027d2687..de6c5956fcb 100644
--- a/vespalib/src/vespa/vespalib/text/lowercase.cpp
+++ b/vespalib/src/vespa/vespalib/text/lowercase.cpp
@@ -20,6 +20,32 @@ LowerCase::convert(vespalib::stringref input)
     return output;
 }
 
+/**
+ * Lowercase the given text and return it as a vector of 32-bit values.
+ *
+ * Every value returned by Utf8Reader::getChar() for the input is passed
+ * through convert() and appended to the result in input order.
+ *
+ * @param input the text to read; only the first input.size() bytes are used
+ * @return the converted values, one per character read from input
+ **/
+std::vector<uint32_t>
+LowerCase::convert_to_ucs4(vespalib::stringref input)
+{
+    std::vector<uint32_t> result;
+    // One slot per input byte; presumably an upper bound on the element
+    // count, since an encoded character occupies at least one byte.
+    result.reserve(input.size());
+    // Give the reader the whole view (pointer and size). A bare input.data()
+    // pointer carries no length, so the reader could not stop at
+    // input.size() and would have to rely on a terminating NUL instead.
+    Utf8Reader reader(input);
+    while (reader.hasMore()) {
+        result.emplace_back(convert(reader.getChar()));
+    }
+    return result;
+}
+
 /* NOTE: the tables below are generated from Java code to |