summary refs log tree commit diff stats
path: root/configdefinitions
diff options
context:
space:
mode:
author Bjørn Christian Seime <bjorncs@yahooinc.com> 2023-06-06 09:50:12 +0200
committer GitHub <noreply@github.com> 2023-06-06 09:50:12 +0200
commit 4ae8a32cd71cc23501f7e1737b27e0bcac7fbd41 (patch)
tree 3e31ecaaab916dd6ce1bd51b3e552e09d578e1eb /configdefinitions
parent 4878116a848f0ceff01c49b67657d63a4113789d (diff)
parent 6c664b24186756021e6b39801b9694d1815311bf (diff)
Merge pull request #27297 from vespa-engine/bjorncs/bert-embedder-services-xml
Bjorncs/bert embedder services xml
Diffstat (limited to 'configdefinitions')
-rw-r--r-- configdefinitions/src/vespa/embedding.bert-base-embedder.def 32
-rw-r--r-- configdefinitions/src/vespa/hugging-face-embedder.def 2
2 files changed, 34 insertions, 0 deletions
diff --git a/configdefinitions/src/vespa/embedding.bert-base-embedder.def b/configdefinitions/src/vespa/embedding.bert-base-embedder.def
new file mode 100644
index 00000000000..2d8e840377b
--- /dev/null
+++ b/configdefinitions/src/vespa/embedding.bert-base-embedder.def
@@ -0,0 +1,32 @@
+
+namespace=embedding
+
+# Wordpiece tokenizer
+tokenizerVocab model
+
+transformerModel model
+
+# Max length of the token sequence the model can handle
+transformerMaxTokens int default=384
+
+# Pooling strategy
+poolingStrategy enum { cls, mean } default=mean
+
+# Input names
+transformerInputIds string default=input_ids
+transformerAttentionMask string default=attention_mask
+transformerTokenTypeIds string default=token_type_ids
+
+# Special token ids
+transformerStartSequenceToken int default=101
+transformerEndSequenceToken int default=102
+
+# Output name
+transformerOutput string default=output_0
+
+# Settings for ONNX model evaluation
+onnxExecutionMode enum { parallel, sequential } default=sequential
+onnxInterOpThreads int default=1
+onnxIntraOpThreads int default=-4 # n=number of threads -> n<0: CPUs/(-n), n==0: CPUs, n>0: n
+# GPU device id, -1 for CPU
+onnxGpuDevice int default=0
diff --git a/configdefinitions/src/vespa/hugging-face-embedder.def b/configdefinitions/src/vespa/hugging-face-embedder.def
index 36957004e02..7ea4227b3cd 100644
--- a/configdefinitions/src/vespa/hugging-face-embedder.def
+++ b/configdefinitions/src/vespa/hugging-face-embedder.def
@@ -21,6 +21,8 @@ transformerOutput string default=last_hidden_state
# Normalize tensors from tokenizer
normalize bool default=false
+poolingStrategy enum { cls, mean } default=mean
+
# Settings for ONNX model evaluation
transformerExecutionMode enum { parallel, sequential } default=sequential
transformerInterOpThreads int default=1