diff options
author | Bjørn Christian Seime <bjorncs@yahooinc.com> | 2023-06-06 09:50:12 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-06-06 09:50:12 +0200 |
commit | 4ae8a32cd71cc23501f7e1737b27e0bcac7fbd41 (patch) | |
tree | 3e31ecaaab916dd6ce1bd51b3e552e09d578e1eb /model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def | |
parent | 4878116a848f0ceff01c49b67657d63a4113789d (diff) | |
parent | 6c664b24186756021e6b39801b9694d1815311bf (diff) |
Merge pull request #27297 from vespa-engine/bjorncs/bert-embedder-services-xml
Bjorncs/bert embedder services xml
Diffstat (limited to 'model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def')
-rw-r--r-- | model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def | 32 |
1 files changed, 0 insertions, 32 deletions
```diff
diff --git a/model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def b/model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def
deleted file mode 100644
index 2d8e840377b..00000000000
--- a/model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def
+++ /dev/null
@@ -1,32 +0,0 @@
-
-namespace=embedding
-
-# Wordpiece tokenizer
-tokenizerVocab model
-
-transformerModel model
-
-# Max length of token sequence model can handle
-transformerMaxTokens int default=384
-
-# Pooling strategy
-poolingStrategy enum { cls, mean } default=mean
-
-# Input names
-transformerInputIds string default=input_ids
-transformerAttentionMask string default=attention_mask
-transformerTokenTypeIds string default=token_type_ids
-
-# special token ids
-transformerStartSequenceToken int default=101
-transformerEndSequenceToken int default=102
-
-# Output name
-transformerOutput string default=output_0
-
-# Settings for ONNX model evaluation
-onnxExecutionMode enum { parallel, sequential } default=sequential
-onnxInterOpThreads int default=1
-onnxIntraOpThreads int default=-4 # n=number of threads -> n<0: CPUs/(-n), n==0: CPUs, n>0: n
-# GPU device id, -1 for CPU
-onnxGpuDevice int default=0
```