aboutsummaryrefslogtreecommitdiffstats
path: root/vespa-documentgen-plugin/etc/complex/sombrerowebdoc.sd.FOO
blob: 1524e7480a0b2a582e031a1c37a6ae5c17e79982 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
# Search definition for the "sombrerowebdoc" document type.
#
# Declares one document type together with the struct and annotation types
# that its fields refer to. Every field in this file has an empty body ({}),
# i.e. no per-field settings are specified here.
search sombrerowebdoc {

  # NOTE: everything down to the closing brace just before the end of the
  # file is inside this document block. The struct/annotation declarations
  # below are indented as if they were siblings of the document, but by
  # brace matching they are nested in it.
  document sombrerowebdoc {
    # NOTE(review): document-level version statement; presumably legacy
    # syntax - confirm the targeted Vespa release still accepts it.
    version : 0

  # Attribute record used as the element type of sombreroPHRASE.attributes.
  # Holds three int fields and three string fields.
  # NOTE(review): presumably attributetype selects between intvalue and
  # strvalue - not visible from this file, confirm with the producer.
  struct sombreroattribute {
    field attributetype type int {}
    field intvalue      type int {}
    field huffmanindex  type int {}
    field lexicon       type string {}
    field name          type string {}
    field strvalue      type string {}
  }

  # Annotation type without any fields; it is the target type of the
  # annotation references held by sombreroPHRASE.
  annotation sombreroTOKEN { }

  # Annotation type carrying two int fields, a list of sombreroattribute
  # structs, and a list of references to sombreroTOKEN annotations.
  annotation sombreroPHRASE {
    field prefixused           type int {}
    field suffixused           type int {}
    field attributes           type array<sombreroattribute> {}
    field annotationreferences type array<annotationreference<sombreroTOKEN>> {}
  }

  # Pair of string fields (id, value); element type of
  # sombrerorule.contentfilters.
  struct sombrerocontentfilter {
    field id    type string {}
    field value type string {}
  }

  # Rule record: a name, a location, and a list of content filters.
  # Element type of the document's "rules" field.
  struct sombrerorule {
    field name           type string {}
    field location       type string {}
    field contentfilters type array<sombrerocontentfilter> {}
  }

  # Metrics record with a single double field.
  # NOTE(review): the unit of executiontime is not stated here - confirm.
  struct sombrerometrics {
    field executiontime type double {}
  }

  # Extraction record: two string fields plus a nested sombrerometrics
  # struct. Type of the document's "extraction" field.
  struct sombreroextraction {
    field adjuncts type string {}
    field metrics  type sombrerometrics {}
    field status   type string {}
  }


    # Document fields. All are plain declarations with empty bodies.
    field url type string {}

    field raw_html type string {}

    field decoded_html type string {}

    # List of sombrerorule structs (declared above).
    field rules type array<sombrerorule> {}

    # Single sombreroextraction struct (declared above).
    field extraction type sombreroextraction {}

    field content_language type string {}

    field dupdetectshinglesketch type string {}

    field mlprisma type string {}

    # The only field of type raw in this document; all other scalar fields
    # are strings.
    field raw_bytes type raw {}

    field charset_encoding type string {}

    field meta_language type string {}

    field language type string {}

    field region type string {}

  }
}