vespalib/src/tests/sequencedtaskexecutor/sequencedtaskexecutor_benchmark.cpp
// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.

#include <vespa/vespalib/util/sequencedtaskexecutor.h>
#include <vespa/vespalib/util/adaptive_sequenced_executor.h>
#include <vespa/vespalib/util/lambdatask.h>
#include <vespa/vespalib/util/time.h>
#include <atomic>
#include <cinttypes>
#include <cstdio>
#include <cstdlib>
#include <memory>

using vespalib::ISequencedTaskExecutor;
using vespalib::SequencedTaskExecutor;
using vespalib::AdaptiveSequencedExecutor;
using ExecutorId = vespalib::ISequencedTaskExecutor::ExecutorId;

// Simulate per-task CPU work: size * 128 integer add/multiply operations.
size_t do_work(size_t size) {
    size_t ret = 0;
    for (size_t i = 0; i < size; ++i) {
        for (size_t j = 0; j < 128; ++j) {
            ret = (ret + i) * j;
        }
    }
    return ret;
}

// Reads benchmark parameters positionally from the command line; each call to
// next() consumes the following argv entry (or uses the fallback) and logs it.
struct SimpleParams {
    int argc;
    char **argv;
    int idx;
    SimpleParams(int argc_in, char **argv_in) : argc(argc_in), argv(argv_in), idx(0) {}
    int next(const char *name, int fallback) {
        ++idx;
        int value = 0;
        if (argc > idx) {
            value = atoi(argv[idx]);
        } else {
            value = fallback;
        }
        fprintf(stderr, "param %s: %d\n", name, value);
        return value;
    }
};
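
// A hypothetical invocation (binary name assumed here) that sets all eight
// parameters requested in main(), in order:
//
//   ./sequencedtaskexecutor_benchmark 0 1 1000000 8 1000 8 32 10
//
// i.e. use_adaptive_executor, optimize_for_throughput, num_tasks, num_strands,
// task_limit, num_threads, max_waiting, work_size.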

VESPA_THREAD_STACK_TAG(sequenced_executor)

int main(int argc, char **argv) {
    SimpleParams params(argc, argv);
    bool use_adaptive_executor = params.next("use_adaptive_executor", 0);
    bool optimize_for_throughput = params.next("optimize_for_throughput", 0);
    size_t num_tasks = params.next("num_tasks", 1000000);
    size_t num_strands = params.next("num_strands", 4);
    size_t task_limit = params.next("task_limit", 1000);
    size_t num_threads = params.next("num_threads", num_strands);
    size_t max_waiting = params.next("max_waiting", optimize_for_throughput ? 32 : 0);
    size_t work_size = params.next("work_size", 0);
    std::atomic<long> counter(0);
    std::unique_ptr<ISequencedTaskExecutor> executor;
    if (use_adaptive_executor) {
        executor = std::make_unique<AdaptiveSequencedExecutor>(num_strands, num_threads, max_waiting, task_limit, true);
    } else {
        auto optimize = optimize_for_throughput
                        ? vespalib::Executor::OptimizeFor::THROUGHPUT
                        : vespalib::Executor::OptimizeFor::LATENCY;
        executor = SequencedTaskExecutor::create(sequenced_executor, num_strands, task_limit, true, optimize);
    }
    vespalib::Timer timer;
    for (size_t task_id = 0; task_id < num_tasks; ++task_id) {
        executor->executeTask(ExecutorId(task_id % num_strands),
                              vespalib::makeLambdaTask([&counter,work_size] { (void) do_work(work_size); counter++; }));
    }
    // Destroying the executor drains and completes all queued tasks, so the
    // measured time covers both scheduling and execution.
    executor.reset();
    fprintf(stderr, "\ntotal time: %" PRId64 " ms\n", vespalib::count_ms(timer.elapsed()));
    return (size_t(counter) == num_tasks) ? 0 : 1;
}