diff options
author | Henning Baldersheim <balder@yahoo-inc.com> | 2023-03-17 10:08:51 +0000 |
---|---|---|
committer | Henning Baldersheim <balder@yahoo-inc.com> | 2023-03-17 10:08:51 +0000 |
commit | 94598bd6506f6a0e5fca79a887bdc1fc1d36c64d (patch) | |
tree | 4ecdc8aa41497552a1f84ba908d3e43be43989b5 | |
parent | f734fd1a7e9213f79782567285b5c3d72c5107ab (diff) |
Add TODO of proton configs that can be clean up and TODO for configs to check.
-rw-r--r-- | searchcore/src/vespa/searchcore/config/proton.def | 84 |
1 files changed, 50 insertions, 34 deletions
diff --git a/searchcore/src/vespa/searchcore/config/proton.def b/searchcore/src/vespa/searchcore/config/proton.def index 375ff0f2012..e85e6c58e11 100644 --- a/searchcore/src/vespa/searchcore/config/proton.def +++ b/searchcore/src/vespa/searchcore/config/proton.def @@ -129,10 +129,6 @@ indexing.write.io enum {NORMAL, OSYNC, DIRECTIO} default=DIRECTIO restart ## Control io options during read both under dump and fusion. indexing.read.io enum {NORMAL, DIRECTIO} default=DIRECTIO restart -## Overrides the number of threads used for writing fields across all document dbs. -## See feeding.concurrency for details. -indexing.threads int default=1 restart - ## Option to specify what is most important during indexing. ## This is experimental and will most likely be temporary. indexing.optimize enum {LATENCY, THROUGHPUT, ADAPTIVE} default=THROUGHPUT restart @@ -141,9 +137,6 @@ indexing.optimize enum {LATENCY, THROUGHPUT, ADAPTIVE} default=THROUGHPUT restar ## indexing threads. Only used when visibility delay is zero. indexing.tasklimit int default=-1000 -## Deprecated and ignored, will soon go away -indexing.semiunboundtasklimit int default = 1000 - ## Kind of watermark for when to activate extra manpower ## Utilized if optimize is set to either THROUGHPUT or ADAPTIVE indexing.kind_of_watermark int default = 0 restart @@ -151,7 +144,6 @@ indexing.kind_of_watermark int default = 0 restart ## Controls minimum reaction time in seconds if using THROUGHPUT indexing.reactiontime double default = 0.001 restart - ## How long a freshly loaded index shall be warmed up ## before being used for serving index.warmup.time double default=0.0 restart @@ -169,10 +161,6 @@ index.maxflushed int default=2 ## Setting to 1 will force an immediate fusion. index.maxflushedretired int default=20 -## How much memory is set aside for caching. -## Now only used for caching of dictionary lookups. -index.cache.size long default=0 restart - ## Control io options during flushing of attributes. attribute.write.io enum {NORMAL, OSYNC, DIRECTIO} default=DIRECTIO restart @@ -180,10 +168,12 @@ attribute.write.io enum {NORMAL, OSYNC, DIRECTIO} default=DIRECTIO restart search.mmap.options[] enum {POPULATE, HUGETLB} restart ## Advise to give to os when mapping memory. +## TODO Check if default should be random search.mmap.advise enum {NORMAL, RANDOM, SEQUENTIAL} default=NORMAL restart ## Max number of threads allowed to handle large queries concurrently ## Positive number means there is a limit, 0 or negative means no limit. +## TODO Check if ever used in config. search.memory.limiter.maxthreads int default=0 ## Minimum coverage of corpus to postprocess before applying above concurrency limit. @@ -210,17 +200,6 @@ distribution.searchablecopies long default=1 ## Negative numbers are a percentage of memory. summary.cache.maxbytes long default=-4 -## Include visits in the cache, if the visitoperation allows it. -## This will enable another separate cache of summary.cache.maxbytes size. -## IGNORED and DEPRECATED Will go away soon -summary.cache.allowvisitcaching bool default=true - -## Control number of cache entries preallocated. -## Default is no preallocation. -## Can be set to a higher number to avoid resizing. -## IGNORED and DEPRECATED Will go away soon -summary.cache.initialentries long default=0 restart - ## Control compression type of the summary while in the cache. summary.cache.compression.type enum {NONE, LZ4, ZSTD} default=LZ4 @@ -234,6 +213,7 @@ summary.cache.update_strategy enum {INVALIDATE, UPDATE} default=INVALIDATE ## Control compression type of the summary while in memory during compaction ## NB So far only stragey=LOG honours it. +## TODO Use same as for store (chunk.compression). summary.log.compact.compression.type enum {NONE, LZ4, ZSTD} default=ZSTD ## Control compression level of the summary while in memory during compaction @@ -253,14 +233,11 @@ summary.log.chunk.compression.level int default=9 ## Max size in bytes per chunk. summary.log.chunk.maxbytes int default=65536 -## Skip crc32 check on read. -## IGNORED and DEPRECATED Will go away soon -summary.log.chunk.skipcrconread bool default=false - ## Max size per summary file. summary.log.maxfilesize long default=1000000000 ## Max number of lid entries per file +## TODO Decide based on memory on node. summary.log.maxnumlids int default=40000000 ## Max disk bloat factor. This will trigger compacting. @@ -279,6 +256,7 @@ summary.write.io enum {NORMAL, OSYNC, DIRECTIO} default=DIRECTIO ## Control io options during read of stored documents. ## All summary.read options will take effect immediately on new files written. ## On old files it will take effect either upon compact or on restart. +## TODO Default is probably DIRECTIO summary.read.io enum {NORMAL, DIRECTIO, MMAP } default=MMAP restart ## Multiple optional options for use with mmap @@ -331,6 +309,7 @@ documentdb[].allocation.active_buffers_ratio double default=0.1 periodic.interval double default=3600.0 ## Connect spec for transactionlog server. +## TODO Consider not using RPC at all tlsspec string default="tcp/localhost:13700" restart ## ConfigId for transactionlogserver @@ -424,6 +403,7 @@ visit.ignoremaxbytes bool default=true ## Number of initializer threads used for loading structures from disk at proton startup. ## The threads are shared between document databases when value is larger than 0. ## When set to 0 (default) we use 1 separate thread per document database. +## TODO Consider if really necessary, could be automatic. initialize.threads int default = 0 ## Portion of max address space used in components in attribute vectors @@ -457,10 +437,12 @@ hwinfo.disk.writespeed double default = 200.0 restart ## Amount of data to write to temporary file when sampling disk write speed. ## Default is 1 GiB. +## TODO Check if still in use hwinfo.disk.samplewritesize long default = 1073741824 restart ## Minimum write speed needed to avoid disk being considered slow. ## Unit is MiB/s, default is 100.0 MiB/s. +## TODO Check if still in use hwinfo.disk.slowwritespeedlimit double default = 100.0 restart ## The size of physical memory (in bytes) available to proton. @@ -496,6 +478,7 @@ feeding.niceness double default = 0.0 restart ## This limit is only considered when executing tasks for handling external feed operations. ## In that case the calling thread (persistence thread) is blocked until the master thread has capacity to handle more tasks. ## When this limit is set to 0 it is ignored. +## TODO Check if still in use feeding.master_task_limit int default = 0 ## Adjustment to resource limit when determining if maintenance jobs can run. @@ -513,6 +496,45 @@ maintenancejobs.maxoutstandingmoveops int default=100 ## in depth understanding is present. bucketdb.checksumtype enum {LEGACY, XXHASH64} default = LEGACY restart +## Chooses the throttling policy used to control the window size +## of the SharedOperationThrottler component used by the transaction log replay feed state. +replay_throttling_policy.type enum { UNLIMITED, DYNAMIC } default=DYNAMIC +## Only used if replay_throttling_policy.type == DYNAMIC: +## TODO consider just hardcoding values as they have never been tuned. +replay_throttling_policy.min_window_size int default=100 +replay_throttling_policy.max_window_size int default=10000 +replay_throttling_policy.window_size_increment int default=20 + +## Everything below are deprecated and ignored. Will go away at any time. + +## Deprecated and ignored, will soon go away +indexing.semiunboundtasklimit int default = 1000 + +## Include visits in the cache, if the visitoperation allows it. +## This will enable another separate cache of summary.cache.maxbytes size. +## IGNORED and DEPRECATED Will go away soon +summary.cache.allowvisitcaching bool default=true + +## Control number of cache entries preallocated. +## Default is no preallocation. +## Can be set to a higher number to avoid resizing. +## IGNORED and DEPRECATED Will go away soon +summary.cache.initialentries long default=0 restart + +## Skip crc32 check on read. +## IGNORED and DEPRECATED Will go away soon +summary.log.chunk.skipcrconread bool default=false + +## Overrides the number of threads used for writing fields across all document dbs. +## See feeding.concurrency for details. +## DEPRECATED - Remove usage +indexing.threads int default=1 restart + +## How much memory is set aside for caching. +## Now only used for caching of dictionary lookups. +## TODO Still relevant, check config model, seems unused. +index.cache.size long default=0 restart + ## Specifies which tensor implementation to use for all backend code. ## ## TENSOR_ENGINE (default) uses DefaultTensorEngine, which has been the production implementation for years. @@ -521,12 +543,6 @@ bucketdb.checksumtype enum {LEGACY, XXHASH64} default = LEGACY restart tensor_implementation enum {TENSOR_ENGINE, FAST_VALUE} default = FAST_VALUE ## Whether to report issues back to the container via protobuf field +## TODO Remove always on forward_issues bool default = true -## Chooses the throttling policy used to control the window size -## of the SharedOperationThrottler component used by the transaction log replay feed state. -replay_throttling_policy.type enum { UNLIMITED, DYNAMIC } default=DYNAMIC -## Only used if replay_throttling_policy.type == DYNAMIC: -replay_throttling_policy.min_window_size int default=100 -replay_throttling_policy.max_window_size int default=10000 -replay_throttling_policy.window_size_increment int default=20 |