diff options
author | Lester Solbakken <lester.solbakken@gmail.com> | 2024-04-16 13:45:27 +0200 |
---|---|---|
committer | Lester Solbakken <lester.solbakken@gmail.com> | 2024-04-16 13:45:27 +0200 |
commit | 8d69cbfb97cc4047f1e952ddbef7c52a74d5a2ef (patch) | |
tree | 1cc6a1a236fac8b479472161a2560cc29e683d8a | |
parent | 66b57cd4feba406e4b8f6821c88d914ac5a5cec1 (diff) |
Add test LLMs to ModelIdResolver
-rw-r--r-- | config-model/src/main/java/com/yahoo/vespa/model/container/xml/ModelIdResolver.java | 6 |
1 files changed, 5 insertions, 1 deletions
```diff
diff --git a/config-model/src/main/java/com/yahoo/vespa/model/container/xml/ModelIdResolver.java b/config-model/src/main/java/com/yahoo/vespa/model/container/xml/ModelIdResolver.java
index f9993b770e5..867ac86f8d5 100644
--- a/config-model/src/main/java/com/yahoo/vespa/model/container/xml/ModelIdResolver.java
+++ b/config-model/src/main/java/com/yahoo/vespa/model/container/xml/ModelIdResolver.java
@@ -26,6 +26,7 @@ public class ModelIdResolver {
     public static final String ONNX_MODEL = "onnx-model";
     public static final String BERT_VOCAB = "bert-vocabulary";
     public static final String SIGNIFICANCE_MODEL = "significance-model";
+    public static final String GGUF_MODEL = "gguf-model";
 
     private static Map<String, ProvidedModel> setupProvidedModels() {
         var m = new HashMap<String, ProvidedModel>();
@@ -60,6 +61,9 @@ public class ModelIdResolver {
 
         register(m, "e5-large-v2", "https://data.vespa.oath.cloud/onnx_models/e5-large-v2/model.onnx", Set.of(ONNX_MODEL));
         register(m, "e5-large-v2-vocab", "https://data.vespa.oath.cloud/onnx_models/e5-large-v2/tokenizer.json", Set.of(HF_TOKENIZER));
+
+        register(m, "mistral-7b", "https://data.vespa.oath.cloud/gguf_models/mistral-7b-instruct-v0.1.Q6_K.gguf", Set.of(GGUF_MODEL));
+        register(m, "mistral-7b-q8", "https://data.vespa.oath.cloud/gguf_models/mistral-7b-instruct-v0.1.Q8_0.gguf", Set.of(GGUF_MODEL));
         return Map.copyOf(m);
     }
 
@@ -124,7 +128,7 @@ public class ModelIdResolver {
             throw new IllegalArgumentException("Unknown model id '" + modelId + "' on '" + valueName + "'. Available models are [" +
                                                providedModels.keySet().stream().sorted().collect(Collectors.joining(", ")) + "]");
         var providedModel = providedModels.get(modelId);
-        if (!providedModel.tags().containsAll(requiredTags)) {
+        if ( ! providedModel.tags().containsAll(requiredTags)) {
             throw new IllegalArgumentException(
                     "Model '%s' on '%s' has tags %s but are missing required tags %s"
                             .formatted(modelId, valueName, providedModel.tags(), requiredTags));
```