diff options
Diffstat (limited to 'lowercasing_test/src/tests/lowercasing/CasingVariants.java')
-rw-r--r-- | lowercasing_test/src/tests/lowercasing/CasingVariants.java | 34 |
1 files changed, 34 insertions, 0 deletions
diff --git a/lowercasing_test/src/tests/lowercasing/CasingVariants.java b/lowercasing_test/src/tests/lowercasing/CasingVariants.java new file mode 100644 index 00000000000..aa1bf8fcf4d --- /dev/null +++ b/lowercasing_test/src/tests/lowercasing/CasingVariants.java @@ -0,0 +1,34 @@ +// Copyright 2016 Yahoo Inc. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. +import static com.yahoo.language.LinguisticsCase.toLowerCase; + +import java.io.File; +import java.io.FileInputStream; +import java.io.FileNotFoundException; +import java.io.IOException; +import java.io.InputStream; +import java.io.InputStreamReader; +import java.io.Reader; + +import com.yahoo.text.Utf8; + +public class CasingVariants { + + public static void main(String[] args) throws FileNotFoundException, IOException { + int read = 0; + char[] buffer = new char[5000]; + String raw; + File f = new File("./letters"); + StringBuilder s = new StringBuilder(); + InputStream in = new FileInputStream(f); + + Reader r = new InputStreamReader(in, Utf8.getCharset()); + while (read != -1) { + read = r.read(buffer); + if (read > 0) { + s.append(buffer, 0, read); + } + } + raw = s.toString(); + System.out.write(Utf8.toBytes(toLowerCase(raw))); + } +} |