forked from Watson-Explorer/wex-wdc-integration-samples
-
Notifications
You must be signed in to change notification settings - Fork 0
/
elperiodico-spanish-template.xml
72 lines (65 loc) · 2.52 KB
/
elperiodico-spanish-template.xml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
<source max-elt-id="357" modified-by="data-explorer-admin" name="elperiodico-spanish-template" template="template" modified="1412625878">
<prototype>
  <!-- Display label and description for this template; the description links to the site being searched. -->
  <label>El Periodico News in Spanish</label>
  <description>
    Use this template to create a source that will search the
    <a href="http://www.elperiodico.com/">El Periodico News in Spanish</a> website.
  </description>

  <!--
    Declared setting "key-from-title": a boolean whose initial value is false.
    NOTE(review): this name is not referenced anywhere in the visible <submit> section;
    confirm where it is consumed.
  -->
  <declare>
    <label>Generate key from title</label>
    <description>
      If false then generate a normal URL-based key for the documents.
      If true then generate a key based on normalizing the story's
      title.
    </description>
    <attribute name="name">key-from-title</attribute>
    <attribute name="type">boolean</attribute>
    <attribute name="initial-value">false</attribute>
  </declare>

  <!--
    Declared setting "max-age": a number whose initial value is -1, which per the
    description below means no age filtering.
    NOTE(review): this name is not referenced anywhere in the visible <submit> section;
    confirm where it is consumed.
  -->
  <declare>
    <label>Maximum article age</label>
    <description>
      Filter articles that are more than this many days old.
      Specifying 0 or negative will keep all articles.
    </description>
    <attribute name="name">max-age</attribute>
    <attribute name="type">number</attribute>
    <attribute name="initial-value">-1</attribute>
  </declare>
</prototype>
<submit>
  <!--
    Request definition: calls standard-form with a GET against the site's basic search URL.
    The user query goes in parameter "q" and paging in parameter "page".
    NOTE(review): per-value 10 with page-offset 1 presumably means 10 results per page and
    1-based page numbers; confirm against the standard-form definition.
    NOTE(review): extra-delimiters holds what looks like additional query-string parameters
    (type, fields, lang, reverse); confirm that is how standard-form uses this argument.
    The value is wrapped in CDATA so its literal ampersands need no escaping.
  -->
  <form>
    <call-function name="standard-form">
      <with name="method-value">GET</with>
      <with name="action-value">http://www.elperiodico.com/buscador/es/basico</with>
      <with name="query-param">q</with>
      <with name="per-value">10</with>
      <with name="page-param">page</with>
      <with name="page-offset">1</with>
      <with name="query-syntax">+ OR quotes</with>
      <with name="extra-delimiters"><![CDATA[&type=news&fields=PUB_DATE&lang=es&reverse=true]]></with>
    </call-function>
  </form>

  <!--
    Response parsing: calls xsl-parser with XPath selectors.
    results-select matches every div whose class attribute is exactly 'item'.
    url-select, title-select and snippet-select are relative paths (h2/a/@href, h2/a, p),
    presumably evaluated against each matched result; confirm in xsl-parser.
    total-results takes the string value of the div with class 'comms_section', keeps the
    text after the first occurrence of 'de', and normalizes its whitespace.
    NOTE(review): 'de' also matches inside longer words, so any earlier word containing
    those letters would shift the cut point; confirm against the live page text.
  -->
  <parser>
    <call-function name="xsl-parser">
      <with name="results-select">//div[@class='item']</with>
      <with name="url-select">h2/a/@href</with>
      <with name="title-select">h2/a</with>
      <with name="snippet-select">p</with>
      <with name="total-results">normalize-space(substring-after( //div[@class='comms_section'], 'de'))</with>
    </call-function>
  </parser>
</submit>
<tests>
  <!--
    Source test: calls search-test with a sample query and result expectations
    (num 20, title length bounds 10 and 100, both length thresholds 0).
    The query is a common Spanish news term because this template targets a
    Spanish-language site (the form sends lang=es); an English word would be unlikely
    to return enough results for the test to be meaningful.
    NOTE(review): the exact meaning of the threshold arguments is defined by search-test;
    confirm there before tuning them.
  -->
  <call-function name="search-test">
    <with name="query">gobierno</with>
    <with name="num">20</with>
    <with name="min-title-len">10</with>
    <with name="max-title-len">100</with>
    <with name="title-len-threshold">0</with>
    <with name="snippet-len-threshold">0</with>
  </call-function>
</tests>
<help />
<description />
</source>