aboutsummaryrefslogtreecommitdiffstats
path: root/searchlib/src/vespa/searchlib/attribute/posting_list_merger.cpp
blob: 877d1c4fcd21b7b934e2a92d1fdcdf6bb9014e5c (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.

#include "posting_list_merger.h"
#include <algorithm>

namespace search::attribute {

template <typename DataT>
PostingListMerger<DataT>::PostingListMerger(uint32_t docIdLimit) noexcept
    : _array(),
      _startPos(),
      _bitVector(),
      _docIdLimit(docIdLimit),
      _arrayValid(false)
{
}

template <typename DataT>
PostingListMerger<DataT>::~PostingListMerger() = default;

template <typename DataT>
void
PostingListMerger<DataT>::reserveArray(uint32_t postingsCount, size_t postingsSize)
{
    _array.reserve(postingsSize);
    _startPos.reserve(postingsCount + 1);
    _startPos.push_back(0);
}


template <typename DataT>
void
PostingListMerger<DataT>::allocBitVector()
{
    _bitVector = BitVector::create(_docIdLimit);
}

template <typename DataT>
void
PostingListMerger<DataT>::merge()
{
    if (_bitVector) {
        _bitVector->invalidateCachedCount();
    } else {
        if (_startPos.size() > 2) {
            PostingVector temp(_array.size());
            _array.swap(merge(_array, temp, _startPos));
        }
        StartVector().swap(_startPos);
        _arrayValid = true;
    }
}


template <typename DataT>
typename PostingListMerger<DataT>::PostingVector &
PostingListMerger<DataT>::merge(PostingVector &v, PostingVector &temp, const StartVector &startPos)
{
    StartVector nextStartPos;
    nextStartPos.reserve((startPos.size() + 1) / 2);
    nextStartPos.push_back(0);
    for (size_t i(0), m((startPos.size() - 1) / 2); i < m; i++) {
        size_t aStart = startPos[i * 2 + 0];
        size_t aEnd = startPos[i * 2 + 1];
        size_t bStart = aEnd;
        size_t bEnd = startPos[i * 2 + 2];
        auto it = v.begin();
        std::merge(it + aStart, it + aEnd,
                   it + bStart, it + bEnd,
                   temp.begin() + aStart);
        nextStartPos.push_back(bEnd);
    }
    if ((startPos.size() - 1) % 2) {
        for (size_t i(startPos[startPos.size() - 2]), m(v.size()); i < m; i++) {
            temp[i] = v[i];
        }
        nextStartPos.push_back(temp.size());
    }
    return (nextStartPos.size() > 2) ? merge(temp, v, nextStartPos) : temp;
}


template class PostingListMerger<vespalib::btree::BTreeNoLeafData>;
template class PostingListMerger<int32_t>;

}