summaryrefslogtreecommitdiffstats
path: root/model-integration
diff options
context:
space:
mode:
authorBjørn Christian Seime <bjorncs@vespa.ai>2023-10-19 10:55:44 +0200
committerBjørn Christian Seime <bjorncs@vespa.ai>2023-10-19 10:55:44 +0200
commit2881a0fea93a519b9a1df24c02e9462e5da3c368 (patch)
tree76b4963f836c1d6b984048f95a0c3509e78de0b0 /model-integration
parent479379d864392f3d6de5c6c78e03214021994d4f (diff)
Disable CPU arena allocator for ONNX
The arena memory allocator pre-allocates an excessive amount of memory up front. Disabling it matches the existing configuration in the ONNX integration for the backend.
Diffstat (limited to 'model-integration')
-rw-r--r--model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java1
1 files changed, 1 insertions, 0 deletions
diff --git a/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java b/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java
index 6dd2c5b05af..cefafc3654b 100644
--- a/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java
+++ b/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java
@@ -41,6 +41,7 @@ public class OnnxEvaluatorOptions {
options.setExecutionMode(executionMode);
options.setInterOpNumThreads(executionMode == PARALLEL ? interOpThreads : 1);
options.setIntraOpNumThreads(intraOpThreads);
+ options.setCPUArenaAllocator(false);
if (loadCuda) {
options.addCUDA(gpuDeviceNumber);
}