aboutsummaryrefslogtreecommitdiffstats
path: root/searchlib/src/vespa/searchlib/attribute/sourceselector.h
blob: 1c1f7ca1a9e96583560461a94c46147e381f9168 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
// Copyright Yahoo. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.

#pragma once

#include "attributememorysavetarget.h"
#include "attributevector.h"
#include <vespa/searchlib/queryeval/isourceselector.h>

namespace search {

class SourceSelector : public queryeval::ISourceSelector
{
private:
protected:
    AttributeVector::SP _realSource;

    queryeval::Source getNewSource(queryeval::Source src, uint32_t diff) {
        return src > diff ? src - diff : 0;
    }

public:
    struct HeaderInfo {
        vespalib::string _baseFileName;
        queryeval::Source _defaultSource;
        uint32_t _baseId;
        uint32_t _docIdLimit;
        HeaderInfo(const vespalib::string & baseFileName,
                   queryeval::Source defaultSource,
                   uint32_t baseId,
                   uint32_t docIdLimit);
    };

    class SaveInfo {
    private:
        HeaderInfo _header;
        AttributeMemorySaveTarget _memSaver;
    public:
        using UP = std::unique_ptr<SaveInfo>;
        using SP = std::shared_ptr<SaveInfo>;
        SaveInfo(const vespalib::string & baseFileName,
                 queryeval::Source defaultSource,
                 uint32_t baseId,
                 uint32_t docIdLimit,
                 AttributeVector & sourceStore);
        ~SaveInfo();
        const HeaderInfo & getHeader() const { return _header; }
        bool save(const TuneFileAttributes &tuneFileAttributes,
                  const search::common::FileHeaderContext &fileHeaderContext);
    };

    class LoadInfo {
    private:
        HeaderInfo _header;
    public:
        using UP = std::unique_ptr<LoadInfo>;
        LoadInfo(const vespalib::string & baseFileName);
        void load();
        const HeaderInfo & header() const { return _header; }
    };

    class Histogram {
    public:
        Histogram() { memset(_h, 0, sizeof(_h)); }
        uint32_t operator [] (queryeval::Source s) const { return _h[s]; }
        void inc(queryeval::Source s) { _h[s]++; }
    private:
        uint32_t _h[256];
    };

public:
    using UP = std::unique_ptr<SourceSelector>;
    SourceSelector(queryeval::Source defaultSource, AttributeVector::SP realSource);
    /**
     * This will compute the distribution of the sources used over the whole lid space.
     */
    Histogram getDistribution() const;
    SaveInfo::UP extractSaveInfo(const vespalib::string & baseFileName);
    static LoadInfo::UP extractLoadInfo(const vespalib::string & baseFileName);

    void setSource(uint32_t docId, queryeval::Source source) override = 0;
    std::unique_ptr<queryeval::sourceselector::Iterator> createIterator() const override = 0;
};

} // namespace search