diff options
Diffstat (limited to 'configdefinitions/src/vespa/hugging-face-embedder.def')
-rw-r--r-- | configdefinitions/src/vespa/hugging-face-embedder.def | 31 |
1 files changed, 31 insertions, 0 deletions
diff --git a/configdefinitions/src/vespa/hugging-face-embedder.def b/configdefinitions/src/vespa/hugging-face-embedder.def new file mode 100644 index 00000000000..7ea4227b3cd --- /dev/null +++ b/configdefinitions/src/vespa/hugging-face-embedder.def @@ -0,0 +1,31 @@ +namespace=embedding.huggingface + +# Path to the tokenizer definition file (tokenizer.json) +tokenizerPath model + +# Path to the transformer model file (model.onnx) +transformerModel model + +# Maximum length of the token sequence the model can handle +transformerMaxTokens int default=512 + +# Names of the model's inputs +transformerInputIds string default=input_ids +transformerAttentionMask string default=attention_mask +transformerTokenTypeIds string default=token_type_ids + +# Name of the model's output +transformerOutput string default=last_hidden_state + + +# Normalize tensors from tokenizer +normalize bool default=false + +poolingStrategy enum { cls, mean } default=mean + +# Settings for ONNX model evaluation. NOTE(review): the negative default for transformerIntraOpThreads is presumably interpreted relative to the available CPU count - confirm against the evaluator options. +transformerExecutionMode enum { parallel, sequential } default=sequential +transformerInterOpThreads int default=1 +transformerIntraOpThreads int default=-4 +# GPU device id; set to -1 to run on CPU +transformerGpuDevice int default=0 |