diff options
Diffstat (limited to 'indexinglanguage/src/main/javacc/IndexingParser.jj')
-rw-r--r-- | indexinglanguage/src/main/javacc/IndexingParser.jj | 3 |
1 file changed, 3 insertions, 0 deletions
diff --git a/indexinglanguage/src/main/javacc/IndexingParser.jj b/indexinglanguage/src/main/javacc/IndexingParser.jj index ea05f33d745..42bbd26cee6 100644 --- a/indexinglanguage/src/main/javacc/IndexingParser.jj +++ b/indexinglanguage/src/main/javacc/IndexingParser.jj @@ -173,6 +173,7 @@ TOKEN : <JOIN: "join"> | <LOWER_CASE: "lowercase"> | <MAX_LENGTH: "max-length"> | + <MAX_OCCURRENCES: "max-occurrences"> | <NGRAM: "ngram"> | <NORMALIZE: "normalize"> | <NOW: "now"> | @@ -664,10 +665,12 @@ AnnotatorConfig tokenizeCfg() : AnnotatorConfig val = new AnnotatorConfig(annotatorCfg); String str = "SHORTEST"; Integer maxLength; + Integer maxTermOccurrences; } { ( <STEM> ( <COLON> str = string() ) ? { val.setStemMode(str); } | <MAX_LENGTH> <COLON> maxLength = integer() { val.setMaxTokenLength(maxLength); } | + <MAX_OCCURRENCES> <COLON> maxTermOccurrences = integer() { val.setMaxTermOccurrences(maxTermOccurrences); } | <NORMALIZE> { val.setRemoveAccents(true); } )+ { return val; } } |