diff options
author | Henning Baldersheim <balder@yahoo-inc.com> | 2019-08-21 07:59:11 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2019-08-21 07:59:11 +0200 |
commit | 415e9e002e4207809247b6bd5f9419960ab43ed1 (patch) | |
tree | 0111e27fb0b3e494401a98279d36c58b48c3d265 /document/src/tests/vespaxml | |
parent | be5759f30affe0e38ea4c442586a457f9cb698f8 (diff) |
Revert "doc: -> id:"
Diffstat (limited to 'document/src/tests/vespaxml')
66 files changed, 690 insertions, 1 deletions
diff --git a/document/src/tests/vespaxml/fieldpathupdates.xml b/document/src/tests/vespaxml/fieldpathupdates.xml index 6c9719a86b9..3b81aaf4ba2 100644..100755 --- a/document/src/tests/vespaxml/fieldpathupdates.xml +++ b/document/src/tests/vespaxml/fieldpathupdates.xml @@ -1,6 +1,6 @@ <!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> <vespafeed> - <update documenttype="news" documentid="id:ns:news::http://www.ntnu.no/"> + <update documenttype="news" documentid="doc:test:http://www.ntnu.no/"> <assign fieldpath="url">assignUrl</assign> <assign fieldpath="title">assignTitle</assign> <assign fieldpath="last_downloaded">1</assign> diff --git a/document/src/tests/vespaxml/test1.expected.xml b/document/src/tests/vespaxml/test1.expected.xml new file mode 100644 index 00000000000..198ed29690d --- /dev/null +++ b/document/src/tests/vespaxml/test1.expected.xml @@ -0,0 +1,5 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<document documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> +</document> diff --git a/document/src/tests/vespaxml/test1.xml b/document/src/tests/vespaxml/test1.xml new file mode 100644 index 00000000000..1ec09a0b61f --- /dev/null +++ b/document/src/tests/vespaxml/test1.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd idprefix="doc:crawler:"> + <document documenttype="news" documentid="http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test10.xml b/document/src/tests/vespaxml/test10.xml new file mode 100644 index 00000000000..832734faf48 --- /dev/null +++ b/document/src/tests/vespaxml/test10.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <title>Test<Title</title> + <last_downloaded>hundred</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test11.xml b/document/src/tests/vespaxml/test11.xml new file mode 100644 index 00000000000..10daff34be3 --- /dev/null +++ b/document/src/tests/vespaxml/test11.xml @@ -0,0 +1,8 @@ +<?xml version="1.0" encoding="iso-8859-1"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <document type="news" id="doc:crawler/http://www.ntnu���.no/"> + </document> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test12.xml b/document/src/tests/vespaxml/test12.xml new file mode 100644 index 00000000000..3bfd2658404 --- /dev/null +++ b/document/src/tests/vespaxml/test12.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <title></title> + <last_downloaded></last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test13.xml b/document/src/tests/vespaxml/test13.xml new file mode 100644 index 00000000000..4e55558abc6 --- /dev/null +++ b/document/src/tests/vespaxml/test13.xml @@ -0,0 +1,7 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> +</vespa> diff --git a/document/src/tests/vespaxml/test14.xml b/document/src/tests/vespaxml/test14.xml new file mode 100644 index 00000000000..8b345f8c654 --- /dev/null +++ b/document/src/tests/vespaxml/test14.xml @@ -0,0 +1,8 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <last_downloaded>123</last_downloaded> + </doc> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test15.xml b/document/src/tests/vespaxml/test15.xml new file mode 100644 index 00000000000..32707f1636b --- /dev/null +++ b/document/src/tests/vespaxml/test15.xml @@ -0,0 +1,8 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <title>TestTitle</tit> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test16.xml b/document/src/tests/vespaxml/test16.xml new file mode 100644 index 00000000000..3b3179446e9 --- /dev/null +++ b/document/src/tests/vespaxml/test16.xml @@ -0,0 +1,8 @@ +<?xml version="1.0" encoding="iso-8859-1"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <documentid type="news" id="doc:crawler:http://www.ntnu.no/"> + </documentid> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test17.xml b/document/src/tests/vespaxml/test17.xml new file mode 100644 index 00000000000..aefcc5708e7 --- /dev/null +++ b/document/src/tests/vespaxml/test17.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/1"> + </document> + </vespaadd> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/2"> + </document> + </vespaadd> diff --git a/document/src/tests/vespaxml/test18.xml b/document/src/tests/vespaxml/test18.xml new file mode 100644 index 00000000000..852dd55c134 --- /dev/null +++ b/document/src/tests/vespaxml/test18.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="article" id="doc:crawler/http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test2.expected.xml b/document/src/tests/vespaxml/test2.expected.xml new file mode 100644 index 00000000000..198ed29690d --- /dev/null +++ b/document/src/tests/vespaxml/test2.expected.xml @@ -0,0 +1,5 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<document documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> +</document> diff --git a/document/src/tests/vespaxml/test2.xml b/document/src/tests/vespaxml/test2.xml new file mode 100644 index 00000000000..8194fb1de5e --- /dev/null +++ b/document/src/tests/vespaxml/test2.xml @@ -0,0 +1,7 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <document documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> +</vespafeed> diff --git a/document/src/tests/vespaxml/test20.xml b/document/src/tests/vespaxml/test20.xml new file mode 100644 index 00000000000..ca502100f67 --- /dev/null +++ b/document/src/tests/vespaxml/test20.xml @@ -0,0 +1,8 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <endoffeed> + <name>default</name> + <generations>10</generations> + <increment>11</increment> + </endoffeed> +</vespafeed> diff --git a/document/src/tests/vespaxml/test21.xml b/document/src/tests/vespaxml/test21.xml new file mode 100644 index 00000000000..45ef52a3e67 --- /dev/null +++ b/document/src/tests/vespaxml/test21.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>21474836480</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test22.xml b/document/src/tests/vespaxml/test22.xml new file mode 100644 index 00000000000..c9f5a0af841 --- /dev/null +++ b/document/src/tests/vespaxml/test22.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <value_long>9223372036854775807</value_long> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test23.xml b/document/src/tests/vespaxml/test23.xml new file mode 100644 index 00000000000..e052c3f2c7f --- /dev/null +++ b/document/src/tests/vespaxml/test23.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <value_long>-9223372036854775807</value_long> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test24.xml b/document/src/tests/vespaxml/test24.xml new file mode 100644 index 00000000000..3d36eea7dc8 --- /dev/null +++ b/document/src/tests/vespaxml/test24.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <value_long>18446744073709551615</value_long> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test25.xml b/document/src/tests/vespaxml/test25.xml new file mode 100644 index 00000000000..9a499195a6b --- /dev/null +++ b/document/src/tests/vespaxml/test25.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <title>TestTitle</title> + <value_long>18446744073709551616</value_long> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test26.xml b/document/src/tests/vespaxml/test26.xml new file mode 100644 index 00000000000..2d6ae226c68 --- /dev/null +++ b/document/src/tests/vespaxml/test26.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>0x123</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test27.xml b/document/src/tests/vespaxml/test27.xml new file mode 100644 index 00000000000..f8adb8b11f8 --- /dev/null +++ b/document/src/tests/vespaxml/test27.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler/http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>0x123</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test28.xml b/document/src/tests/vespaxml/test28.xml new file mode 100644 index 00000000000..929ba7415d0 --- /dev/null +++ b/document/src/tests/vespaxml/test28.xml @@ -0,0 +1,10 @@ +<!-- Test content --> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitleContent</title> + <value_content contenttype="text/html" encoding="utf-8" language="en"><![CDATA[<html><body><h1>This is the title</h1></body></html>]]></value_content> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test29.xml b/document/src/tests/vespaxml/test29.xml new file mode 100644 index 00000000000..1b863e5637e --- /dev/null +++ b/document/src/tests/vespaxml/test29.xml @@ -0,0 +1,18 @@ +<!-- Test field attribute --> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news"> + <field name="uri">doc:crawler:http://www.ntnu.no/</field> + <field name="title">TestTitleContent</field> + <field name="value_content" contenttype="text/html" encoding="UTF-8" language="NO">This is content</field> + <last_downloaded>345</last_downloaded> + </document> + <document type="news"> + <field name="uri">doc:crawler:http://www.ntnu.no/2</field> + <field name="title">TestTitleContent2</field> + <field name="value_content">This is content2</field> + <last_downloaded>345</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test3.xml b/document/src/tests/vespaxml/test3.xml new file mode 100644 index 00000000000..f328115b5ca --- /dev/null +++ b/document/src/tests/vespaxml/test3.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove idprefix="doc:crawler:"> + <documentid type="news"> + <uri>http://www.ntnu.no/</uri> + <last_downloaded></last_downloaded> + </documentid> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test30.xml b/document/src/tests/vespaxml/test30.xml new file mode 100644 index 00000000000..fa24e99cd83 --- /dev/null +++ b/document/src/tests/vespaxml/test30.xml @@ -0,0 +1,15 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed xmlns:xsd="http://www.w3.org/2001/XMLSchema-datatypes" + xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title xsi:type="xsd:hexBinary">E5AEB6E59BADE3808220044BE680AC</title> + <last_downloaded>100</last_downloaded> + </document> + <document type="news" id="doc:crawler:http://www.ntnu.org/"> + <title xsi:type="xsd:base64Binary">5a625Zut44CCIARL5oCs</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> +</vespafeed> + diff --git a/document/src/tests/vespaxml/test32.xml b/document/src/tests/vespaxml/test32.xml new file mode 100644 index 00000000000..53993f57d19 --- /dev/null +++ b/document/src/tests/vespaxml/test32.xml @@ -0,0 +1,7 @@ +<?xml version="1.0" encoding="iso-8859-1"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <documentid id="doc:crawler:http://www.ntnu���.no/"/> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test33.xml b/document/src/tests/vespaxml/test33.xml new file mode 100644 index 00000000000..d63c059aa6e --- /dev/null +++ b/document/src/tests/vespaxml/test33.xml @@ -0,0 +1,9 @@ +<?xml version="1.0" encoding="iso-8859-1"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <documentid> + <uri>http://www.ntnu.no/</uri> + </documentid> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test34.xml b/document/src/tests/vespaxml/test34.xml new file mode 100644 index 00000000000..384c7ae8111 --- /dev/null +++ b/document/src/tests/vespaxml/test34.xml @@ -0,0 +1,7 @@ +<?xml version="1.0" encoding="iso-8859-1"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <documentid id="http://www.ntnu.no/"/> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test35.xml b/document/src/tests/vespaxml/test35.xml new file mode 100644 index 00000000000..e69f032ef49 --- /dev/null +++ b/document/src/tests/vespaxml/test35.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title binaryencoding="base64">VmVzcGEgcnVsZXM=</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test36.xml b/document/src/tests/vespaxml/test36.xml new file mode 100644 index 00000000000..bfd4547b6c8 --- /dev/null +++ b/document/src/tests/vespaxml/test36.xml @@ -0,0 +1,43 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd idprefix="doc:crawler:"> + <document type="news" id="http://www.ntnu.no/1"> + <title>TestTitle1</title> + <last_downloaded>100</last_downloaded> + <stringarr> + <item>one</item> + <item>two</item> + <item>three</item> + <item>four</item> + <item>five</item> + </stringarr> + <intarr> + <item>1</item> + <item>2</item> + <item>3</item> + <item>4</item> + <item>5</item> + </intarr> + </document> + <document type="news" id="http://www.ntnu.no/2"> + <title>TestTitle2</title> + <intarr> + <item>o1</item> + </intarr> + </document> + <document type="news" id="http://www.ntnu.no/3"> + <title>TestTitle3</title> + <intarr> + <tem>1</tem> + </intarr> + </document> + <document type="news" id="http://www.ntnu.no/4"> + <title>TestTitle4</title> + <intarr></intarr> + </document> + <document type="news" id="http://www.ntnu.no/5"> + <title>TestTitle5</title> + <intarr>1</intarr> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test37.xml b/document/src/tests/vespaxml/test37.xml new file mode 100644 index 00000000000..8993dd99640 --- /dev/null +++ b/document/src/tests/vespaxml/test37.xml @@ -0,0 +1,23 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd idprefix="doc:crawler:"> + <document type="news" id="http://www.ntnu.no/1"> + <title>TestTitle1</title> + <last_downloaded>100</last_downloaded> + <weightedsetstring> + <item>one</item> + <item>two</item> + <item>three</item> + <item>four</item> + <item>five</item> + </weightedsetstring> + <weightedsetint> + <item>1</item> + <item>2</item> + <item>3</item> + <item>4</item> + <item>5</item> + </weightedsetint> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test4.xml b/document/src/tests/vespaxml/test4.xml new file mode 100644 index 00000000000..8a4777344d6 --- /dev/null +++ b/document/src/tests/vespaxml/test4.xml @@ -0,0 +1,23 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + + <vespaadd idprefix="doc:crawler:"> + <document type="news" id="http://www.uio.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> + + <document type="news" id="http://www.dagbladet.no/"> + <title>Title2</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> + + <vespaadd> + <document type="news" id="doc:crawler2:http://www.vg.no/"> + <title>Title2</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> + +</vespafeed> diff --git a/document/src/tests/vespaxml/test40.xml b/document/src/tests/vespaxml/test40.xml new file mode 100644 index 00000000000..68210920df2 --- /dev/null +++ b/document/src/tests/vespaxml/test40.xml @@ -0,0 +1,6 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <assign field="title">TestTitle</assign> + </update> +</vespafeed> diff --git a/document/src/tests/vespaxml/test41.xml b/document/src/tests/vespaxml/test41.xml new file mode 100644 index 00000000000..b92c2e586a8 --- /dev/null +++ b/document/src/tests/vespaxml/test41.xml @@ -0,0 +1,22 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <assign field="stringarr"> + <item>First</item> + <item>Second</item> + </assign> + <add field="stringarr"> + <item>Third</item> + <item>Fourth</item> + </add> + <remove field="stringarr"> + <item>Fifth</item> + <item>Sixth</item> + </remove> + <assign field="intarr"> + <item>100</item> + <item>200</item> + </assign> + <assign field="intarr"></assign> + </update> +</vespafeed> diff --git a/document/src/tests/vespaxml/test42.xml b/document/src/tests/vespaxml/test42.xml new file mode 100644 index 00000000000..479509776fa --- /dev/null +++ b/document/src/tests/vespaxml/test42.xml @@ -0,0 +1,22 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <assign field="weightedsetstring"> + <item weight="1">First</item> + <item weight="2">Second</item> + </assign> + <add field="weightedsetstring"> + <item weight="3">Third</item> + <item weight="4">Fourth</item> + </add> + <remove field="weightedsetstring"> + <item>Fifth</item> + <item>Sixth</item> + </remove> + <assign field="weightedsetint"> + <item weight="1">100</item> + <item weight="2">200</item> + </assign> + <assign field="weightedsetint"></assign> + </update> +</vespafeed> diff --git a/document/src/tests/vespaxml/test43.xml b/document/src/tests/vespaxml/test43.xml new file mode 100644 index 00000000000..874deada10c --- /dev/null +++ b/document/src/tests/vespaxml/test43.xml @@ -0,0 +1,32 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <document documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <value_long>1008</value_long> + <weightedsetstring> + <item weight="1">First</item> + <item weight="2">Second</item> + </weightedsetstring> + </document> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <increment field="value_long" by="1" /> + <decrement field="value_long" by="2" /> + <divide field="value_long" by="3" /> + <multiply field="value_long" by="4" /> + </update> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <alter field="value_long"> + <increment by="5" /> + <decrement by="6" /> + </alter> + <alter field="value_long"> + <divide by="7" /> + <multiply by="8" /> + </alter> + </update> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <increment field="weightedsetstring" by="9"> + <key>First</key> + <key>Second</key> + </increment> + </update> +</vespafeed> diff --git a/document/src/tests/vespaxml/test45.xml b/document/src/tests/vespaxml/test45.xml new file mode 100644 index 00000000000..ccc1a475a86 --- /dev/null +++ b/document/src/tests/vespaxml/test45.xml @@ -0,0 +1,6 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <update documenttype="news" documentid="doc:crawler:http://www.ntnu.no/"> + <remove field="floatarr" /> + </update> +</vespafeed> diff --git a/document/src/tests/vespaxml/test46.xml b/document/src/tests/vespaxml/test46.xml new file mode 100644 index 00000000000..118dfdd810d --- /dev/null +++ b/document/src/tests/vespaxml/test46.xml @@ -0,0 +1,10 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <document documenttype="news" documentid="doc:crawler:http://www.blargh.example.com/" lastmodified="98798787"> + <value_long>1008</value_long> + <weightedsetstring> + <item weight="1">First</item> + <item weight="2">Second</item> + </weightedsetstring> + </document> +</vespafeed> diff --git a/document/src/tests/vespaxml/test47.xml b/document/src/tests/vespaxml/test47.xml new file mode 100644 index 00000000000..e9499c32810 --- /dev/null +++ b/document/src/tests/vespaxml/test47.xml @@ -0,0 +1,10 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- VERY BAD: --> + <vespaadd> + <documentid type="news"> + <uri>doc:this:is:very:bad</uri> + </documentid> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test48.xml b/document/src/tests/vespaxml/test48.xml new file mode 100644 index 00000000000..119d3ea82d4 --- /dev/null +++ b/document/src/tests/vespaxml/test48.xml @@ -0,0 +1,6 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- VERY BAD: --> + <documentid type="news" id="doc:this:is:even:worse" /> +</vespafeed> diff --git a/document/src/tests/vespaxml/test49.xml b/document/src/tests/vespaxml/test49.xml new file mode 100644 index 00000000000..d3fa4dc9637 --- /dev/null +++ b/document/src/tests/vespaxml/test49.xml @@ -0,0 +1,8 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- VERY BAD: --> + <documentid type="news"> + <uri>doc:this:is:very:very:ugly</uri> + </documentid> +</vespafeed> diff --git a/document/src/tests/vespaxml/test5.expected.xml b/document/src/tests/vespaxml/test5.expected.xml new file mode 100644 index 00000000000..5b851a4601e --- /dev/null +++ b/document/src/tests/vespaxml/test5.expected.xml @@ -0,0 +1,3 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<remove documentid="doc:crawler:http://www.ntnu.no/"/> + diff --git a/document/src/tests/vespaxml/test5.xml b/document/src/tests/vespaxml/test5.xml new file mode 100644 index 00000000000..bdfa496cb86 --- /dev/null +++ b/document/src/tests/vespaxml/test5.xml @@ -0,0 +1,6 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <documentid documentid="doc:crawler:http://www.ntnu.no/"/> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test50.xml b/document/src/tests/vespaxml/test50.xml new file mode 100644 index 00000000000..45c4c0a4d13 --- /dev/null +++ b/document/src/tests/vespaxml/test50.xml @@ -0,0 +1,8 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- OK: --> + <vesparemove> + <documentid type="news" id="doc:this:an:ok:removal"/> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test51.xml b/document/src/tests/vespaxml/test51.xml new file mode 100644 index 00000000000..9e91d45d930 --- /dev/null +++ b/document/src/tests/vespaxml/test51.xml @@ -0,0 +1,6 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- OK: --> + <remove documentid="doc:this:is:also:an:ok:removal"/> +</vespafeed> diff --git a/document/src/tests/vespaxml/test52.xml b/document/src/tests/vespaxml/test52.xml new file mode 100644 index 00000000000..a8617df42da --- /dev/null +++ b/document/src/tests/vespaxml/test52.xml @@ -0,0 +1,10 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- OK: --> + <vespaadd> + <document documentid="doc:blah:blah:blah" documenttype="news"> + <value_long>2345</value_long> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test53.xml b/document/src/tests/vespaxml/test53.xml new file mode 100644 index 00000000000..6449436ff54 --- /dev/null +++ b/document/src/tests/vespaxml/test53.xml @@ -0,0 +1,11 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- HALF BAD, BUT NOT ALLOWED: --> + <vespaadd> + <document documentid="doc:blah:blah:blah" documenttype="news"> + <value_long>2345</value_long> + </document> + <documentid type="news" id="doc:half:bad:add"/> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test54.xml b/document/src/tests/vespaxml/test54.xml new file mode 100644 index 00000000000..7535f4b93ea --- /dev/null +++ b/document/src/tests/vespaxml/test54.xml @@ -0,0 +1,10 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- VERY BAD: --> + <vesparemove> + <document documentid="doc:bluh:bluh:bluh" documenttype="news"> + <value_long>45</value_long> + </document> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test55.xml b/document/src/tests/vespaxml/test55.xml new file mode 100644 index 00000000000..b2134a29a46 --- /dev/null +++ b/document/src/tests/vespaxml/test55.xml @@ -0,0 +1,11 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- HALF BAD, BUT NOT ALLOWED: --> + <vesparemove> + <documentid type="news" id="doc:this:remove:is:half:bad"/> + <document documentid="doc:bluh:bluh:bluh" documenttype="news"> + <value_long>45</value_long> + </document> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test56.xml b/document/src/tests/vespaxml/test56.xml new file mode 100644 index 00000000000..1dd36a57b68 --- /dev/null +++ b/document/src/tests/vespaxml/test56.xml @@ -0,0 +1,8 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- VERY BAD: --> + <vesparemove> + <document documentid="doc:bluh:bluh:bluh" documenttype="news" /> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test57.xml b/document/src/tests/vespaxml/test57.xml new file mode 100644 index 00000000000..d75e6d4d099 --- /dev/null +++ b/document/src/tests/vespaxml/test57.xml @@ -0,0 +1,8 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <!-- OK: --> + <document documentid="doc:blih:blih:blih" documenttype="news"> + <value_long>235</value_long> + </document> +</vespafeed> diff --git a/document/src/tests/vespaxml/test58.xml b/document/src/tests/vespaxml/test58.xml new file mode 100644 index 00000000000..8711a2a49e4 --- /dev/null +++ b/document/src/tests/vespaxml/test58.xml @@ -0,0 +1,15 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + + <document type="news" id="doc:music:http://music.yahoo.com"> + <url>http://music.yahoo.com</url> + <stringarr> + <item>yahoo<item> + <item>hello</item> + </stringarr> + </document> + + + +</vespafeed> diff --git a/document/src/tests/vespaxml/test59.xml b/document/src/tests/vespaxml/test59.xml new file mode 100644 index 00000000000..e7708351c93 --- /dev/null +++ b/document/src/tests/vespaxml/test59.xml @@ -0,0 +1,7 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <update documentid="doc:blih:blih:blih" documenttype="news"> + <increment field="title" by="3549" /> + </update> +</vespafeed> diff --git a/document/src/tests/vespaxml/test6.xml b/document/src/tests/vespaxml/test6.xml new file mode 100644 index 00000000000..3739690d2fe --- /dev/null +++ b/document/src/tests/vespaxml/test6.xml @@ -0,0 +1,7 @@ +<?xml version="1.0" encoding="iso-8859-1"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <documentid type="news" id="doc:crawler:http://www.ntnu���.no/"/> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test7.xml b/document/src/tests/vespaxml/test7.xml new file mode 100644 index 00000000000..129773678f1 --- /dev/null +++ b/document/src/tests/vespaxml/test7.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed idprefix="doc:crawler:"> + <vespaadd> + <document type="news" id="http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100.5</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test8.xml b/document/src/tests/vespaxml/test8.xml new file mode 100644 index 00000000000..272791511c1 --- /dev/null +++ b/document/src/tests/vespaxml/test8.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" id="doc:crawler:http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>hundred</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test9.xml b/document/src/tests/vespaxml/test9.xml new file mode 100644 index 00000000000..b733c66a797 --- /dev/null +++ b/document/src/tests/vespaxml/test9.xml @@ -0,0 +1,7 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vesparemove> + <documentid id="doc:crawler/http://www.ntnu���.no/"/> + </vesparemove> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_arraystruct.xml b/document/src/tests/vespaxml/test_arraystruct.xml new file mode 100644 index 00000000000..ba5c3233e16 --- /dev/null +++ b/document/src/tests/vespaxml/test_arraystruct.xml @@ -0,0 +1,19 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <document documenttype="news" documentid="doc:test:struct"> + <mystructarr> + <item> + <intval>36</intval> + <stringval>test</stringval> + </item> + <item> + <intval>39</intval> + <stringval>test2</stringval> + </item> + <item> + <intval>100</intval> + <stringval>cooool</stringval> + </item> + </mystructarr> + </document> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_doc5.xml b/document/src/tests/vespaxml/test_doc5.xml new file mode 100644 index 00000000000..30ce5f7b8f8 --- /dev/null +++ b/document/src/tests/vespaxml/test_doc5.xml @@ -0,0 +1,8 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <endoffeed> + <name>default</name> + <generation>10</generation> + <increment>20</increment> + </endoffeed> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_doc6.xml b/document/src/tests/vespaxml/test_doc6.xml new file mode 100644 index 00000000000..52015073f96 --- /dev/null +++ b/document/src/tests/vespaxml/test_doc6.xml @@ -0,0 +1,6 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <endoffeed> + <name>default</name> + </endoffeed> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_doc8.xml b/document/src/tests/vespaxml/test_doc8.xml new file mode 100644 index 00000000000..f5c7a2090ae --- /dev/null +++ b/document/src/tests/vespaxml/test_doc8.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd> + <document type="news" version="13" id="http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_externalentity.xml b/document/src/tests/vespaxml/test_externalentity.xml new file mode 100644 index 00000000000..014d67d32bc --- /dev/null +++ b/document/src/tests/vespaxml/test_externalentity.xml @@ -0,0 +1,11 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<!DOCTYPE vespafeed [<!ENTITY xxe SYSTEM "xxe.txt">]> +<vespafeed> + <vespaadd idprefix="doc:crawler:"> + <document documenttype="news" documentid="http://www.ntnu.no/"> + <title>&xxe;</title> + <last_downloaded>100</last_downloaded> + </document> + </vespaadd> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_idprefix.xml b/document/src/tests/vespaxml/test_idprefix.xml new file mode 100644 index 00000000000..2b0487d0b94 --- /dev/null +++ b/document/src/tests/vespaxml/test_idprefix.xml @@ -0,0 +1,13 @@ +<?xml version="1.0" encoding="utf-8"?> +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + + <document type="news" id="http://music.yahoo.com/bobdylan/BestOf"> + <title>Best of Bob Dylan</title> + </document> + + <document type="news" id="http://music.yahoo.com/metallica/BestOf"> + <title>Best of Metallica</title> + </document> + +</vespafeed> diff --git a/document/src/tests/vespaxml/test_struct.xml b/document/src/tests/vespaxml/test_struct.xml new file mode 100644 index 00000000000..251b8b4896d --- /dev/null +++ b/document/src/tests/vespaxml/test_struct.xml @@ -0,0 +1,9 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <document documenttype="news" documentid="doc:test:struct"> + <mystruct> + <intval>36</intval> + <stringval>test</stringval> + </mystruct> + </document> +</vespafeed> diff --git a/document/src/tests/vespaxml/test_update1.xml b/document/src/tests/vespaxml/test_update1.xml new file mode 100644 index 00000000000..89dcb978e3b --- /dev/null +++ b/document/src/tests/vespaxml/test_update1.xml @@ -0,0 +1,12 @@ +<!-- Copyright 2017 Yahoo Holdings. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root. --> +<vespafeed> + <vespaadd idprefix="doc:crawler:"> + <document type="news" id="http://www.ntnu.no/"> + <title>TestTitle</title> + <last_downloaded>100</last_downloaded> + </document> + <update documenttype="news" documentid="http://www.ntnu.no/"> + <divide field="last_downloaded" by="0" /> + </update> + </vespaadd> +</vespafeed> |