summary refs log tree commit diff stats
path: root/lowercasing_test/src/tests/lowercasing/CasingVariants.java
diff options
context:
space:
mode:
Diffstat (limited to 'lowercasing_test/src/tests/lowercasing/CasingVariants.java')
-rw-r--r-- lowercasing_test/src/tests/lowercasing/CasingVariants.java 34
1 files changed, 34 insertions, 0 deletions
diff --git a/lowercasing_test/src/tests/lowercasing/CasingVariants.java b/lowercasing_test/src/tests/lowercasing/CasingVariants.java
new file mode 100644
index 00000000000..aa1bf8fcf4d
--- /dev/null
+++ b/lowercasing_test/src/tests/lowercasing/CasingVariants.java
@@ -0,0 +1,34 @@
+// Copyright 2016 Yahoo Inc. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
+import static com.yahoo.language.LinguisticsCase.toLowerCase;
+
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.FileNotFoundException;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.InputStreamReader;
+import java.io.Reader;
+
+import com.yahoo.text.Utf8;
+
+/**
+ * Reads the file ./letters (decoded with Utf8.getCharset()), lowercases the whole text with
+ * LinguisticsCase.toLowerCase, and writes the bytes from Utf8.toBytes to standard output.
+ */
+public class CasingVariants {
+    /** Runs the conversion; args is unused. Throws IOException when ./letters cannot be opened or read. */
+    public static void main(String[] args) throws FileNotFoundException, IOException {
+        char[] buffer = new char[5000];
+        StringBuilder s = new StringBuilder();
+        // try-with-resources closes both streams, also when reading fails part-way through.
+        try (InputStream in = new FileInputStream(new File("./letters"));
+             Reader r = new InputStreamReader(in, Utf8.getCharset())) {
+            int read;
+            while ((read = r.read(buffer)) != -1) { // -1 signals end of stream
+                s.append(buffer, 0, read);
+            }
+        }
+        System.out.write(Utf8.toBytes(toLowerCase(s.toString())));
+        System.out.flush(); // do not depend on stdout auto-flush for the raw byte write
+    }
+}