aboutsummaryrefslogtreecommitdiffstats
path: root/linguistics/src/test/java/com/yahoo/language/simple/SimpleTokenTypeTestCase.java
blob: afea3c33721b9b513ce3aa17529131927f9535a3 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
// Copyright Yahoo. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
package com.yahoo.language.simple;

import com.yahoo.language.process.TokenType;
import org.junit.Test;

import static org.junit.Assert.assertEquals;

/**
 * Checks the {@link TokenType} that {@code SimpleTokenType.valueOf} reports for a selection of
 * individual characters, including one outside the Basic Multilingual Plane.
 *
 * @author Steinar Knutsen
 */
public class SimpleTokenTypeTestCase {

    @Test
    public final void test() {
        assertTokenType(TokenType.ALPHABETIC, 'a');
        assertTokenType(TokenType.ALPHABETIC, '\u02c1');
        assertTokenType(TokenType.ALPHABETIC, '\u01c0');
        assertTokenType(TokenType.SYMBOL, '\u20dd');
        assertTokenType(TokenType.ALPHABETIC, '\u0912');
        assertTokenType(TokenType.NUMERIC, '1');
        assertTokenType(TokenType.PUNCTUATION, '.');
        assertTokenType(TokenType.PUNCTUATION, '\u0f3b');
        assertTokenType(TokenType.PUNCTUATION, '\u0f3c');
        assertTokenType(TokenType.PUNCTUATION, '\u203f');
        assertTokenType(TokenType.SYMBOL, '\u2044');
        assertTokenType(TokenType.SYMBOL, '$');
        assertTokenType(TokenType.ALPHABETIC, '\u2132');
        // Supplementary code point U+103C8, written as its UTF-16 surrogate pair.
        assertTokenType(TokenType.ALPHABETIC, '\uD800', '\uDFC8');
    }

    /**
     * Asserts the token type reported for a single UTF-16 code unit.
     *
     * @param expected the token type the character should be classified as
     * @param c the character to classify
     */
    private static void assertTokenType(TokenType expected, char c) {
        // The message names the code point so a failure identifies the offending character.
        assertEquals(describe(c), expected, SimpleTokenType.valueOf(c));
    }

    /**
     * Asserts the token type reported for the code point encoded by a surrogate pair.
     *
     * @param expected the token type the code point should be classified as
     * @param high the high (leading) surrogate
     * @param low the low (trailing) surrogate
     */
    private static void assertTokenType(TokenType expected, char high, char low) {
        int codePoint = Character.toCodePoint(high, low);
        assertEquals(describe(codePoint), expected, SimpleTokenType.valueOf(codePoint));
    }

    /** Formats a code point in the conventional {@code U+XXXX} notation for failure messages. */
    private static String describe(int codePoint) {
        return String.format("U+%04X", codePoint);
    }

}