1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
|
// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
#include "documenttypemapping.h"
#include <vespa/document/repo/documenttyperepo.h>
#include <vespa/document/datatype/documenttype.h>
#include <vespa/vespalib/stllike/hash_map.hpp>
#include <algorithm>
#include <stdexcept>
#include <string>
#include <vespa/log/log.h>
LOG_SETUP(".vsm.common.documenttypemapping");
namespace vsm {
/**
 * Creates a mapping with no field path maps, an empty default document type
 * name, no default document type and no per-type statistics.
 * init() is the member that fills these in.
 */
DocumentTypeMapping::DocumentTypeMapping()
    : _fieldMap(),
      _defaultDocumentTypeName(),
      _defaultDocumentType(nullptr),   // no default document type until init() sets one
      _documentTypeFreq()
{
}
/// Nothing to release by hand; the members clean up after themselves.
DocumentTypeMapping::~DocumentTypeMapping() = default;
namespace {

/**
 * Builds the key under which a document type is stored in the field map:
 * the document type name followed by the character '0'.
 *
 * @param docType document type to derive the key from.
 * @return the type name with "0" appended.
 */
vespalib::string getDocTypeId(const document::DocumentType & docType)
{
    vespalib::string id(docType.getName());
    // The trailing "0" is a hardcoded version; versions are not supported.
    id.append("0");
    return id;
}

}
/**
 * Selects the default document type and builds the field path map for it.
 *
 * The type is looked up by name in repo, its id (see getDocTypeId()) becomes
 * the default document type name, and buildFieldMap() is invoked for it.
 *
 * @param defaultDocumentType name of the document type to look up in repo.
 * @param fieldList           field name -> field id entries passed on to buildFieldMap().
 * @param repo                repository used to resolve defaultDocumentType.
 * @throws std::runtime_error if repo yields no document type for the name.
 *         No member has been modified when this is thrown.
 */
void DocumentTypeMapping::init(const vespalib::string & defaultDocumentType,
                               const StringFieldIdTMapT & fieldList,
                               const document::DocumentTypeRepo &repo)
{
    // Resolve into a local first: the pointer is dereferenced right below, and
    // a failed lookup must not leave a null default document type behind.
    const document::DocumentType * docType = repo.getDocumentType(defaultDocumentType);
    if (docType == nullptr) {
        std::string msg("Default document type '");
        msg.append(defaultDocumentType.c_str());
        msg.append("' not found in document type repo.");
        throw std::runtime_error(msg);
    }

    _defaultDocumentType = docType;
    _defaultDocumentTypeName = getDocTypeId(*docType);
    LOG(debug, "Setting default document type to '%s'",
        _defaultDocumentTypeName.c_str());
    buildFieldMap(_defaultDocumentType, fieldList, _defaultDocumentTypeName);
}
/**
 * Hands out a field path map for the default document type.
 *
 * If a map is registered under the default document type name, map is set to
 * a newly allocated copy of it. Otherwise a warning is logged and map is set
 * to a newly allocated empty map.
 *
 * @param map receives the shared field path map; any previous value is replaced.
 * @return always true.
 */
bool DocumentTypeMapping::prepareBaseDoc(SharedFieldPathMap & map) const
{
    const auto entry = _fieldMap.find(_defaultDocumentTypeName);
    if (entry == _fieldMap.end()) {
        LOG(warning, "No FieldPathMap found for default document type '%s'. Using empty one",
            _defaultDocumentTypeName.c_str());
        map = std::make_shared<FieldPathMapT>();
        return true;
    }

    // Copy, so the caller gets its own map rather than a view into _fieldMap.
    map = std::make_shared<FieldPathMapT>(entry->second);
    LOG(debug, "Found FieldPathMap for default document type '%s' with %zd elements",
        _defaultDocumentTypeName.c_str(), map->size());
    return true;
}
void DocumentTypeMapping::buildFieldMap(
const document::DocumentType *docTypePtr,
const StringFieldIdTMapT & fieldList, const vespalib::string & typeId)
{
LOG(debug, "buildFieldMap: docType = '%s', fieldList.size = '%zd', typeId = '%s'",
docTypePtr->getName().c_str(), fieldList.size(), typeId.c_str());
const document::DocumentType & docType = *docTypePtr;
size_t highestFNo(0);
for (const auto& elem : fieldList) {
highestFNo = std::max(highestFNo, size_t(elem.second));
}
highestFNo++;
FieldPathMapT & fieldMap = _fieldMap[typeId];
fieldMap.resize(highestFNo);
size_t validCount(0);
for (const auto& elem : fieldList) {
vespalib::string fname = elem.first;
LOG(debug, "Handling %s -> %d", fname.c_str(), elem.second);
try {
if ((elem.first[0] != '[') && (elem.first != "summaryfeatures") && (elem.first != "rankfeatures") && (elem.first != "ranklog") && (elem.first != "sddocname") && (elem.first != "documentid")) {
FieldPath fieldPath;
docType.buildFieldPath(fieldPath, fname);
fieldMap[elem.second] = std::move(fieldPath);
validCount++;
LOG(spam, "Found %s -> %d in document", fname.c_str(), elem.second);
}
} catch (const std::exception & e) {
LOG(debug, "Could not get field info for '%s' in documenttype '%s' (id = '%s') : %s",
elem.first.c_str(), docType.getName().c_str(), typeId.c_str(), e.what());
}
}
_documentTypeFreq.insert(std::make_pair(validCount, docTypePtr));
}
/**
 * Returns the document type held by the last entry of _documentTypeFreq.
 * NOTE(review): presumably the container is ordered by the valid-field count
 * recorded in buildFieldMap(), which would make this the type with the most
 * resolved fields; confirm against the member's declaration.
 *
 * @return reference to the document type of the last registered entry.
 * @throws std::runtime_error if no document type has been registered.
 */
const document::DocumentType & DocumentTypeMapping::getCurrentDocumentType() const
{
    if (!_documentTypeFreq.empty()) {
        return *_documentTypeFreq.rbegin()->second;
    }
    throw std::runtime_error("No document type registered yet.");
}
}
|