summary | refs | log | tree | commit | diff | stats
path: root/model-integration/src
diff options
context:
space:
mode:
author Lester Solbakken <lesters@oath.com> 2022-04-06 15:42:16 +0200
committer Lester Solbakken <lesters@oath.com> 2022-04-06 15:42:16 +0200
commit 0040e513d9ebf634130615dde62b2908c4aa9aa1 (patch)
tree 9d153ffe7204cf2a7d1b744cb94ed962c68c72e2 /model-integration/src
parent 7359332a2a806c84c2e504da60b9c5b087e81747 (diff)
Move embedder config def to configdefinitions and serialize as reference
Diffstat (limited to 'model-integration/src')
-rw-r--r-- model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def | 27
1 files changed, 0 insertions, 27 deletions
diff --git a/model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def b/model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def
deleted file mode 100644
index a37599de411..00000000000
--- a/model-integration/src/main/resources/configdefinitions/embedding.bert-base-embedder.def
+++ /dev/null
@@ -1,27 +0,0 @@
-
-namespace=embedding
-
-# Transformer model settings
-transformerModelUrl url default=https://data.vespa.oath.cloud/onnx_models/sentence_all_MiniLM_L6_v2.onnx
-
-# Max length of token sequence model can handle
-transformerMaxTokens int default=384
-
-# Pooling strategy
-poolingStrategy enum { cls, mean } default=mean
-
-# Input names
-transformerInputIds string default=input_ids
-transformerAttentionMask string default=attention_mask
-transformerTokenTypeIds string default=token_type_ids
-
-# Output name
-transformerOutput string default=output_0
-
-# Settings for ONNX model evaluation
-onnxExecutionMode enum { parallel, sequential } default=sequential
-onnxInterOpThreads int default=1
-onnxIntraOpThreads int default=-4 # n=number of threads -> n<0: CPUs/(-n), n==0: CPUs, n>0: n
-
-# Settings for wordpiece tokenizer
-tokenizerVocabUrl url default=https://data.vespa.oath.cloud/onnx_models/bert-base-uncased-vocab.txt