searchlib/src/vespa/searchlib/predicate/predicate_interval_store.cpp


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112

// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.

#include "predicate_interval_store.h"
#include "predicate_interval.h"
#include <vespa/vespalib/datastore/datastore.hpp>

using vespalib::datastore::BufferState;
using vespalib::datastore::EntryRef;
using std::vector;

namespace search::predicate {

/**
 * Allocates a raw array of 'size' elements of type T from the buffer
 * type identified by 'type_id', and returns the resulting reference
 * together with a pointer to the allocated data.
 */
template <typename T>
PredicateIntervalStore::Entry<T>
PredicateIntervalStore::allocNewEntry(uint32_t type_id, uint32_t size)
{
    auto allocated = _store.rawAllocator<T>(type_id).alloc(size);
    Entry<T> entry{RefType(allocated.ref), allocated.data};
    return entry;
}

/**
 * Constructs an empty interval store.
 *
 * A single buffer type (_size1Type) is registered with the underlying
 * data store before its primary buffers are initialized. The reference
 * cache is built on top of an adapter wrapping the same data store.
 */
PredicateIntervalStore::PredicateIntervalStore()
    : _store(),
      // NOTE(review): the arguments presumably describe the array size and
      // buffer sizing limits for this type - confirm against the buffer
      // type declaration.
      _size1Type(1, 1024u, RefType::offsetSize()),
      _store_adapter(_store),
      _ref_cache(_store_adapter)
{

    // This order determines type ids. Only one type is registered;
    // insert() allocates with type id 0, which presumably refers to it.
    _store.addType(&_size1Type);

    // Buffers are initialized only after the type has been registered.
    _store.init_primary_buffers();
}

/**
 * Drops the buffers of the underlying data store on destruction.
 */
PredicateIntervalStore::~PredicateIntervalStore()
{
    _store.dropBuffers();
}

//
// NOTE: Entries are allocated as arrays of uint32_t, but they hold
// arrays of either Interval or IntervalWithBounds objects (PODs).
// The objects are memcpy'ed into the uint32_t arrays, and the get()
// function typecasts them back to the object type the caller expects.
// The EntryRef does not reveal which type an entry holds; the caller
// must know it.
//
// Since the caller knows the correct type anyway, this avoids having
// separate buffers for Interval and IntervalWithBounds objects.
//
/**
 * Stores the given intervals and returns a reference to them.
 *
 * - An empty vector yields a default-constructed EntryRef.
 * - A single-word entry whose value does not exceed DATA_REF_MASK is
 *   returned directly as the reference value; nothing is allocated.
 * - If the reference cache already knows identical content, the
 *   cached reference is returned.
 * - Otherwise a new entry is allocated. When the size (in uint32_t
 *   words) is below MAX_SIZE it is encoded in the reference itself;
 *   if not, the size bits of the reference are set to SIZE_MASK and
 *   the size is stored as the first word of the entry, ahead of the
 *   interval data. The new reference is then added to the cache.
 */
template <typename IntervalT>
EntryRef
PredicateIntervalStore::insert(const vector<IntervalT> &intervals) {
    // Size of the entry, counted in uint32_t words.
    const uint32_t size = entrySize<IntervalT>() * intervals.size();
    if (size == 0) {
        return EntryRef();
    }
    if (size == 1 && intervals[0].interval <= RefCacheType::DATA_REF_MASK) {
        return EntryRef(intervals[0].interval);
    }

    const uint32_t *words = reinterpret_cast<const uint32_t *>(&intervals[0]);
    if (uint32_t cached_ref = _ref_cache.find(words, size)) {
        return EntryRef(cached_ref);
    }

    // Large entries need one extra leading word to hold their size.
    const bool size_in_ref = size < RefCacheType::MAX_SIZE;
    auto entry = allocNewEntry<uint32_t>(0, size_in_ref ? size : size + 1);
    uint32_t *dest = entry.buffer;
    if (!size_in_ref) {
        *dest++ = size;
    }
    memcpy(dest, words, size * sizeof(uint32_t));

    const EntryRef ref = size_in_ref
        ? EntryRef(entry.ref.ref() | (size << RefCacheType::SIZE_SHIFT))
        : EntryRef(entry.ref.ref() | RefCacheType::SIZE_MASK);
    _ref_cache.insert(ref.ref());
    return ref;
}
// Explicitly instantiate insert() for the two interval types that are
// stored, since the template is defined in this translation unit.
template EntryRef PredicateIntervalStore::insert<Interval>(const vector<Interval> &);
template EntryRef PredicateIntervalStore::insert<IntervalWithBounds>(const vector<IntervalWithBounds> &);

/**
 * Removes the entry referenced by 'ref'.
 *
 * Currently this never releases anything: invalid references and
 * references with buffer id 0 return early, and the hold logic for
 * all other references is disabled (kept below for reference).
 */
void
PredicateIntervalStore::remove(EntryRef ref) {
    if (!ref.valid()) {
        return;
    }
    const uint32_t buffer_id = RefType(ref).bufferId();
    if (buffer_id == 0) {
        // Single interval optimization.
        return;
    }
    // Don't remove anything.

    // BufferState &state = _store.getBufferState(buffer_id);
    // uint32_t type_id = state.getTypeId();
    // uint32_t size = type_id <= MAX_ARRAY_SIZE ? type_id : 1;
    // _store.hold_entries(ref, size);
}

/**
 * Forwards the oldest generation still in use to the underlying data
 * store's reclaim_memory().
 */
void PredicateIntervalStore::reclaim_memory(generation_t oldest_used_gen)
{
    _store.reclaim_memory(oldest_used_gen);
}

/**
 * Forwards the current generation to the underlying data store's
 * assign_generation().
 */
void PredicateIntervalStore::assign_generation(generation_t current_gen)
{
    _store.assign_generation(current_gen);
}

}