1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
|
// Copyright Yahoo. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
package com.yahoo.schema;
import org.junit.Ignore;
import org.junit.Test;
import java.util.function.Function;
import java.util.regex.Pattern;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;
/**
 * Unit tests for the rank feature name helpers in {@link FeatureNames}.
 *
 * @author bratseth
 */
public class FeatureNamesTestCase {

    /**
     * Checks which feature strings yield an argument: "foo(...)" is expected to yield none,
     * while query, attribute and constant features are expected to yield the text in the parentheses.
     */
    @Test
    public void testArgument() {
        String[] arguments = { "bar", "bar.baz" };

        // "foo(...)" is expected to have no argument, with or without a dot in it
        for (String argument : arguments) {
            assertFalse(FeatureNames.argumentOf("foo(" + argument + ")").isPresent());
        }

        // Same order as a hand-written list: query(bar), query(bar.baz), attribute(bar), ...
        for (String feature : new String[] { "query", "attribute", "constant" }) {
            for (String argument : arguments) {
                assertEquals(argument, FeatureNames.argumentOf(feature + "(" + argument + ")").get());
            }
        }
    }

    /** Expects a constant feature for "foo" to render as "constant(foo)". */
    @Test
    public void testConstantFeature() {
        String rendered = FeatureNames.asConstantFeature("foo").toString();
        assertEquals("constant(foo)", rendered);
    }

    /** Expects an attribute feature for "foo" to render as "attribute(foo)". */
    @Test
    public void testAttributeFeature() {
        String rendered = FeatureNames.asAttributeFeature("foo").toString();
        assertEquals("attribute(foo)", rendered);
    }

    /** Expects a query feature for the dotted name "foo.bar" to render with the name in double quotes. */
    @Test
    public void testQueryFeature() {
        String rendered = FeatureNames.asQueryFeature("foo.bar").toString();
        assertEquals("query(\"foo.bar\")", rendered);
    }

    /** Checks which names are expected to be usable without quoting. */
    @Test
    public void testLegalFeatureNames() {
        // A lone underscore is accepted ...
        assertTrue(FeatureNames.notNeedQuotes("_"));
        // ... a lone dash is not ...
        assertFalse(FeatureNames.notNeedQuotes("-"));
        // ... but a dash following another accepted character is
        assertTrue(FeatureNames.notNeedQuotes("_-"));
        // Digits, lower and upper case letters, underscores and dashes mixed together
        assertTrue(FeatureNames.notNeedQuotes("0_-azAZxy98-_"));
        // Same string with a trailing '+' is expected to need quotes
        assertFalse(FeatureNames.notNeedQuotes("0_-azAZxy98-_+"));
    }

    /**
     * Compares the handcoded validity check against an equivalent regular expression.
     * Remove the {@code @Ignore} annotation to verify performance.
     *
     * 2021/09/05 performance was a factor of 5.25:
     * 'Identifier handcoded validity check took 4301ms
     *  Identifier regexp validity check took 22609ms'
     */
    @Test
    @Ignore
    public void benchMarkPatternMatching() {
        final int warmupReps = 1000;
        final int measuredReps = 100000;

        Pattern identifierPattern = Pattern.compile("[A-Za-z0-9_][A-Za-z0-9_-]*");

        // 1000 distinct strings which both checks are expected to accept
        String[] candidates = new String[1000];
        for (int index = 0; index < candidates.length; index++) {
            candidates[index] = index + "-legal_string" + index;
        }

        // Short warmup rounds first, then the rounds whose timings are of interest
        countValid(candidates, warmupReps, "handcoded warmup", FeatureNames::notNeedQuotes);
        countValid(candidates, warmupReps, "regexp warmup",
                   (candidate) -> identifierPattern.matcher(candidate).matches());
        countValid(candidates, measuredReps, "handcoded", FeatureNames::notNeedQuotes);
        countValid(candidates, measuredReps, "regexp",
                   (candidate) -> identifierPattern.matcher(candidate).matches());
    }

    /**
     * Applies func to every string numReps times, asserts that every application returned true,
     * and prints the elapsed wall clock time in milliseconds to standard out.
     *
     * @param strings the strings to check on each repetition
     * @param numReps the number of passes over strings
     * @param text a label included in the printed timing line
     * @param func the validity check being timed
     */
    private void countValid(String [] strings, int numReps, String text, Function<String, Boolean> func) {
        int accepted = 0;
        long startNanos = System.nanoTime();
        for (int rep = 0; rep < numReps; rep++) {
            for (int i = 0; i < strings.length; i++) {
                if (func.apply(strings[i])) {
                    accepted++;
                }
            }
        }
        long elapsedNanos = System.nanoTime() - startNanos;

        // Every string must have been accepted on every pass
        assertEquals(strings.length * numReps, accepted);

        long elapsedMillis = elapsedNanos / 1000000;
        System.out.println("Identifier " + text + " validity check took " + elapsedMillis + "ms");
    }

}
|