about | summary | refs | log | tree | commit | diff | stats
path: root/linguistics-components/src/main/resources/configdefinitions
diff options
context:
space:
mode:
author: Bjørn Christian Seime <bjorncs@yahooinc.com> 2023-05-12 10:21:48 +0200
committer: Bjørn Christian Seime <bjorncs@yahooinc.com> 2023-05-12 10:21:48 +0200
commit: e030993d0c356ba6acd50c3e64da5a1f6e1538fd (patch)
tree: 853878e89743d224a67ba6edb44ec803e1ca9bcf /linguistics-components/src/main/resources/configdefinitions
parent: bef1950a75be8b256df07ca5ef6aacd1731c5ef9 (diff)
Revert "Revert "Bjorncs/huggingface tokenizer""
This reverts commit 2bb74878879b3acb1919fd658b8f2c476d8129d6.
Diffstat (limited to 'linguistics-components/src/main/resources/configdefinitions')
-rw-r--r-- linguistics-components/src/main/resources/configdefinitions/language.huggingface.hugging-face-tokenizer.def | 11
1 files changed, 11 insertions, 0 deletions
diff --git a/linguistics-components/src/main/resources/configdefinitions/language.huggingface.hugging-face-tokenizer.def b/linguistics-components/src/main/resources/configdefinitions/language.huggingface.hugging-face-tokenizer.def
new file mode 100644
index 00000000000..a3e54ea38da
--- /dev/null
+++ b/linguistics-components/src/main/resources/configdefinitions/language.huggingface.hugging-face-tokenizer.def
@@ -0,0 +1,11 @@
+# Copyright Yahoo. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
+
+namespace=language.huggingface
+
+# The language a model is for, one of the language tags in com.yahoo.language.Language.
+# Use "unknown" for models to be used with any language.
+model[].language string
+# The path to the model relative to the application package root
+model[].path path
+
+addSpecialTokens bool default=true
\ No newline at end of file