summaryrefslogtreecommitdiffstats
path: root/searchlib/src/tests/features/util/util_test.cpp
blob: e51eb8e77b87d50af184fec2e6d11311d6be563c (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
#include <vespa/searchlib/features/utils.h>
#include <vespa/searchlib/fef/test/indexenvironment.h>
#include <vespa/searchlib/fef/test/queryenvironment.h>
#include <vespa/vespalib/gtest/gtest.h>

using namespace search;
using namespace search::fef;
using namespace search::fef::test;
using namespace search::features;
using namespace search::features::util;

namespace search::features::util {

void PrintTo(const DocumentFrequency& document_frequency, std::ostream* os) {
    *os << "{" << document_frequency.frequency << "," << document_frequency.count << "}";
}

}

SimpleTermData make_term(uint32_t uid) {
    SimpleTermData term;
    term.setUniqueId(uid);
    return term;
}

struct TermLabelFixture {
    IndexEnvironment indexEnv;
    QueryEnvironment queryEnv;
    TermLabelFixture() : indexEnv(), queryEnv(&indexEnv) {
        queryEnv.getTerms().push_back(make_term(5));
        queryEnv.getTerms().push_back(make_term(0));
        queryEnv.getTerms().push_back(make_term(10));
        queryEnv.getProperties().add("vespa.label.foo.id", "5");
        queryEnv.getProperties().add("vespa.label.bar.id", "0"); // undefined uid
        queryEnv.getProperties().add("vespa.label.baz.id", "10");
        queryEnv.getProperties().add("vespa.label.fox.id", "7"); // non-existing
    }
};

TEST(UtilsTest, require_that_label_can_be_mapped_to_term)
{
    TermLabelFixture f1;
    EXPECT_EQ((ITermData*)&f1.queryEnv.getTerms()[0], getTermByLabel(f1.queryEnv, "foo"));
    EXPECT_EQ((ITermData*)0, getTermByLabel(f1.queryEnv, "bar"));
    EXPECT_EQ((ITermData*)&f1.queryEnv.getTerms()[2], getTermByLabel(f1.queryEnv, "baz"));
    EXPECT_EQ((ITermData*)0, getTermByLabel(f1.queryEnv, "fox"));
    EXPECT_EQ((ITermData*)0, getTermByLabel(f1.queryEnv, "unknown"));
}

template <typename T>
void verifyStrToNum(const std::string& label) {
    SCOPED_TRACE(label);
    EXPECT_EQ(-17, static_cast<long>(strToNum<T>("-17")));
    EXPECT_EQ(-1, static_cast<long>(strToNum<T>("-1")));
    EXPECT_EQ(0, static_cast<long>(strToNum<T>("0")));
    EXPECT_EQ(1, static_cast<long>(strToNum<T>("1")));
    EXPECT_EQ(17, static_cast<long>(strToNum<T>("17")));
    EXPECT_EQ(0, static_cast<long>(strToNum<T>("0x0")));
    EXPECT_EQ(1, static_cast<long>(strToNum<T>("0x1")));
    EXPECT_EQ(27, static_cast<long>(strToNum<T>("0x1b")));
}

TEST(UtilsTest, verify_str2Num)
{
    verifyStrToNum<int8_t>("int8_t");
    verifyStrToNum<int16_t>("int16_t");
    verifyStrToNum<int32_t>("int32_t");
    verifyStrToNum<int64_t>("int64_t");
}

TEST(UtilsTest, lookup_document_frequency)
{
    using OptDF = std::optional<DocumentFrequency>;
    IndexEnvironment index_env;;
    QueryEnvironment query_env(&index_env);
    query_env.getTerms() = std::vector<SimpleTermData>{make_term(0), make_term(5), make_term(6), make_term(10)};
    // Properties not used due to bad unique id
    query_env.getProperties().add("vespa.term.0.docfreq", "11");
    query_env.getProperties().add("vespa.term.0.docfreq", "17");
    // Incomplete properties, thus not used
    query_env.getProperties().add("vespa.term.6.docfreq", "5");
    // Complete properties
    query_env.getProperties().add("vespa.term.10.docfreq", "10");
    query_env.getProperties().add("vespa.term.10.docfreq", "15");
    EXPECT_EQ(OptDF(), lookup_document_frequency(query_env, 0)); // bad unique id
    EXPECT_EQ(OptDF(), lookup_document_frequency(query_env, 1)); // missing properties
    EXPECT_EQ(OptDF(), lookup_document_frequency(query_env, 2)); // incomplete properties
    EXPECT_EQ(OptDF({10, 15}), lookup_document_frequency(query_env, 3));
    EXPECT_EQ(OptDF(), lookup_document_frequency(query_env, 4)); // term not found
}

GTEST_MAIN_RUN_ALL_TESTS()