diff options
author | Bjørn Christian Seime <bjorncs@vespa.ai> | 2023-10-19 10:55:44 +0200 |
---|---|---|
committer | Bjørn Christian Seime <bjorncs@vespa.ai> | 2023-10-19 10:55:44 +0200 |
commit | 2881a0fea93a519b9a1df24c02e9462e5da3c368 (patch) | |
tree | 76b4963f836c1d6b984048f95a0c3509e78de0b0 /model-integration | |
parent | 479379d864392f3d6de5c6c78e03214021994d4f (diff) |
Disable CPU arena allocator for ONNX
The arena memory allocator pre-allocates an excessive amount of memory up front.
Disabling it matches the existing configuration in the ONNX integration for the backend.
Diffstat (limited to 'model-integration')
-rw-r--r-- | model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java | 1 |
1 file changed, 1 insertion, 0 deletions
diff --git a/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java b/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java
index 6dd2c5b05af..cefafc3654b 100644
--- a/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java
+++ b/model-integration/src/main/java/ai/vespa/modelintegration/evaluator/OnnxEvaluatorOptions.java
@@ -41,6 +41,7 @@ public class OnnxEvaluatorOptions {
         options.setExecutionMode(executionMode);
         options.setInterOpNumThreads(executionMode == PARALLEL ? interOpThreads : 1);
         options.setIntraOpNumThreads(intraOpThreads);
+        options.setCPUArenaAllocator(false);
         if (loadCuda) {
             options.addCUDA(gpuDeviceNumber);
         }