about summary refs log tree commit diff stats
path: root/model-integration
diff options
context:
space:
mode:
author Lester Solbakken <lesters@oath.com> 2021-09-14 15:29:43 +0200
committer Lester Solbakken <lesters@oath.com> 2021-09-14 15:29:43 +0200
commit a379a7dd17c5b96147cc48c8eb4ec5c1fb32cf56 (patch)
tree 89c94c208796279fd41de09a111f0c86ce630d0f /model-integration
parent c6da7caab7aabf5db505ab3043295ba7c7bc4cc8 (diff)
Set default session options for ONNX-RT stateless eval
Diffstat (limited to 'model-integration')
-rw-r--r-- model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluator.java 3
1 files changed, 3 insertions, 0 deletions
diff --git a/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluator.java b/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluator.java
index 51d54d719c2..b782a79f14b 100644
--- a/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluator.java
+++ b/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluator.java
@@ -30,6 +30,9 @@ public class OnnxEvaluator {
environment = OrtEnvironment.getEnvironment();
OrtSession.SessionOptions options = new OrtSession.SessionOptions();
options.setOptimizationLevel(OrtSession.SessionOptions.OptLevel.ALL_OPT);
+ options.setIntraOpNumThreads(Math.max(1, Runtime.getRuntime().availableProcessors() / 4));
+ options.setInterOpNumThreads(1);
+ options.setExecutionMode(OrtSession.SessionOptions.ExecutionMode.SEQUENTIAL);
session = environment.createSession(modelPath, options);
} catch (OrtException e) {
throw new RuntimeException("ONNX Runtime exception", e);