blob: 1524e7480a0b2a582e031a1c37a6ae5c17e79982 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
|
# Search definition for the "sombrerowebdoc" document type.
# It declares helper structs, two annotation types and the document's
# top-level fields. No indexing statements, attributes or rank profiles
# are configured here: every field body is empty.
search sombrerowebdoc {

    document sombrerowebdoc {

        version : 0

        # ---- Annotation support types ----

        # Record stored in the "attributes" array of sombreroPHRASE:
        # three int members and three string members.
        struct sombreroattribute {
            field attributetype type int {}
            field intvalue type int {}
            field huffmanindex type int {}
            field lexicon type string {}
            field name type string {}
            field strvalue type string {}
        }

        # Annotation type without any fields of its own; it is the target
        # type of the references held by sombreroPHRASE.
        annotation sombreroTOKEN { }

        # Annotation type carrying two int fields, an array of
        # sombreroattribute structs and an array of references to
        # sombreroTOKEN annotations.
        annotation sombreroPHRASE {
            field prefixused type int {}
            field suffixused type int {}
            field attributes type array<sombreroattribute> {}
            field annotationreferences type array<annotationreference<sombreroTOKEN>> {}
        }

        # ---- Rule structs ----

        # An id/value pair of strings; element type of
        # sombrerorule.contentfilters.
        struct sombrerocontentfilter {
            field id type string {}
            field value type string {}
        }

        # A named rule with a location string and a list of content
        # filters; element type of the document's "rules" field.
        struct sombrerorule {
            field name type string {}
            field location type string {}
            field contentfilters type array<sombrerocontentfilter> {}
        }

        # ---- Extraction structs ----

        # Holds a single double, "executiontime".
        # NOTE(review): the time unit is not stated in this file - confirm
        # with the producer of the data.
        struct sombrerometrics {
            field executiontime type double {}
        }

        # Groups an adjuncts string, a nested sombrerometrics struct and a
        # status string; type of the document's "extraction" field.
        struct sombreroextraction {
            field adjuncts type string {}
            field metrics type sombrerometrics {}
            field status type string {}
        }

        # ---- Document fields ----

        # String fields for the URL and the HTML payload.
        field url type string {}
        field raw_html type string {}
        field decoded_html type string {}

        # Struct-typed fields built from the structs declared above.
        field rules type array<sombrerorule> {}
        field extraction type sombreroextraction {}

        # Further string fields.
        field content_language type string {}
        field dupdetectshinglesketch type string {}
        field mlprisma type string {}

        # The only field of type "raw" in this document.
        field raw_bytes type raw {}

        # String fields for charset, language and region values.
        field charset_encoding type string {}
        field meta_language type string {}
        field language type string {}
        field region type string {}
    }
}
|