diff options
Diffstat (limited to 'configdefinitions/src/vespa/embedding.bert-base-embedder.def')
-rw-r--r-- | configdefinitions/src/vespa/embedding.bert-base-embedder.def | 27 |
1 files changed, 27 insertions, 0 deletions
diff --git a/configdefinitions/src/vespa/embedding.bert-base-embedder.def b/configdefinitions/src/vespa/embedding.bert-base-embedder.def new file mode 100644 index 00000000000..a37599de411 --- /dev/null +++ b/configdefinitions/src/vespa/embedding.bert-base-embedder.def @@ -0,0 +1,27 @@ + +namespace=embedding + +# Transformer model settings: URL of the ONNX model file +transformerModelUrl url default=https://data.vespa.oath.cloud/onnx_models/sentence_all_MiniLM_L6_v2.onnx + +# Maximum length of the token sequence the model can handle +transformerMaxTokens int default=384 + +# Pooling strategy (one of: cls, mean) +poolingStrategy enum { cls, mean } default=mean + +# Names of the transformer model's inputs +transformerInputIds string default=input_ids +transformerAttentionMask string default=attention_mask +transformerTokenTypeIds string default=token_type_ids + +# Name of the transformer model's output +transformerOutput string default=output_0 + +# Settings for ONNX model evaluation +onnxExecutionMode enum { parallel, sequential } default=sequential +onnxInterOpThreads int default=1 +onnxIntraOpThreads int default=-4 # n sets the number of threads: n<0 means CPUs/(-n), n==0 means CPUs, n>0 means exactly n +# Settings for the WordPiece tokenizer: URL of the vocabulary file +tokenizerVocabUrl url default=https://data.vespa.oath.cloud/onnx_models/bert-base-uncased-vocab.txt |