diff options
author | Jo Kristian Bergum <bergum@yahooinc.com> | 2023-09-21 12:02:08 +0200 |
---|---|---|
committer | Jo Kristian Bergum <bergum@yahooinc.com> | 2023-09-21 12:02:08 +0200 |
commit | d4692ee4fe82f34958679f0f87777a6e5c23d8db (patch) | |
tree | 3c070c4c5a624482d7639561e972544d8e456fde /configdefinitions | |
parent | 7faeffcc5901ae88c1c3d1814665d0db6ca1d900 (diff) |
Add ColBERT embedder
Diffstat (limited to 'configdefinitions')
-rw-r--r-- | configdefinitions/src/vespa/col-bert-embedder.def | 36 |
1 files changed, 36 insertions, 0 deletions
diff --git a/configdefinitions/src/vespa/col-bert-embedder.def b/configdefinitions/src/vespa/col-bert-embedder.def new file mode 100644 index 00000000000..c7944847d8b --- /dev/null +++ b/configdefinitions/src/vespa/col-bert-embedder.def @@ -0,0 +1,36 @@ + +namespace=embedding + +# Path to tokenizer.json +tokenizerPath model + +# Path to model.onnx +transformerModel model + +# Max query tokens for ColBERT +maxQueryTokens int default=32 + +# Max document tokens for ColBERT +maxDocumentTokens int default=512 + +# Max length of token sequence model can handle +transformerMaxTokens int default=512 + +# Input names +transformerInputIds string default=input_ids +transformerAttentionMask string default=attention_mask + +# Special token ids +transformerStartSequenceToken int default=101 +transformerEndSequenceToken int default=102 +transformerMaskToken int default=103 + +# Output name +transformerOutput string default=contextual + +# Settings for ONNX model evaluation +transformerExecutionMode enum { parallel, sequential } default=sequential +transformerInterOpThreads int default=1 +transformerIntraOpThreads int default=-4 +# GPU device id, -1 for CPU +transformerGpuDevice int default=0 |