-
Notifications
You must be signed in to change notification settings - Fork 11
/
parse.json
193 lines (193 loc) · 8.04 KB
/
parse.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
{
"opensource.com":{
"title":".pane-node-title > h1:nth-child(1)",
"author":"div.pane-os-content-article-byline:nth-child(3) > div:nth-child(1) > span:nth-child(2) > a:nth-child(1)",
"authorlink":"div.pane-os-content-article-byline:nth-child(3) > div:nth-child(1) > span:nth-child(2) > a:nth-child(1)::attr(href)",
"date":".byline__date",
"summary":".field-name-field-article-subhead > div:nth-child(1) > h2:nth-child(1)",
"content":[".os-article__image > div:nth-child(1) > div:nth-child(1) > div:nth-child(1) > div:nth-child(1)",
".pane-node-body"],
"exclude":[".embedded-callout-menu",".field-name-body > div:nth-child(1) > div:nth-child(1) > .rtecenter",".element-invisible"],
"cleanup_command":"sed 's$<pre>$[code]$g;s$</pre>$[/code]$g'|tidy -q --force-output yes --drop-empty-elements no --drop-empty-paras no --indent no"
},
"www.2daygeek.com":{
"title":"h1.entry-title",
"author":".url",
"authorlink":".url::attr(href)",
"date":".hm-date",
"content":[".entry-content"],
"exclude":[".sharedaddy","noscript"]
},
"www.linuxtechi.com":{
"title":".post-title",
"author":".author",
"authorlink":".author > .fn > a:nth-child(1)::attr(href)",
"date":".published",
"content":[".entry-inner"],
"exclude":[],
"cleanup_command":"sed 's$\\[email protected\\]$root@linuxtechi$g'|tidy -q --force-output yes --drop-empty-elements no --drop-empty-paras no --indent no"
},
"twobithistory.org":{
"title":".post-header > h1:nth-child(1)",
"date":".meta > em:nth-child(1)",
"content":["article"],
"exclude":[],
"cleanup_command":"hxclean"
},
"dave.cheney.net":{
"title":".entry-title",
"date":".entry-date",
"author":".author > .url",
"authorlink":".author > .url::attr(href)",
"content":[".entry-content"],
"exclude":[],
"cleanup_command":"hxclean"
},
"linuxaria.com":{
"title":".entry-title",
"author":"",
"authorlink":"",
"date":".year,.month,.day",
"content":[".entry > p"],
"exclude":[".wp-flattr-button"]
},
"itsfoss.com":{
"title":".post-hero__title",
"author":".post-info__author > a:nth-child(1)",
"authorlink":".post-info__author > a:nth-child(1)::attr(href)",
"date":".post-info__dr > time:nth-child(1)::attr(datetime)",
"content":[".post"],
"exclude":[".apester-unit",".ss-inline-share-wrapper",".ss-hidden-pin-image"],
"cleanup_command":"hxclean"
},
"news.itsfoss.com":{
"title":".c-topper__headline",
"author":".c-topper__byline > a:nth-child(3)",
"authorlink":".c-topper__byline > a:nth-child(3)::attr(href)",
"date":".c-topper__timestamp::attr(datetime)",
"summary":".c-topper__standfirst",
"content":[".c-content"],
"exclude":[".apester-unit","#more-from-its-foss + ul","#more-from-its-foss",".ss-inline-share-wrapper",".ss-hidden-pin-image",".sharedaddy",".jp-relatedposts-i2","aside"],
"cleanup_command":"hxclean"
},
"www.networkworld.com":{
"title":"[itemprop=headline]",
"author":".fn",
"authorlink":"[itemprop=name] > [itemprop=url]::attr(href)",
"date":"[itemprop=datePublished]::attr(content)",
"summary":".deck",
"content":[".lede-container","#drr-container"],
"exclude":[".excerpt-text"]
},
"www.zdnet.com":{
"title":".storyHeader > h1:nth-child(1)",
"author":"[itemprop=author]",
"authorlink": "[itemprop=author]::attr(href)",
"date":".meta > time:nth-child(3)::attr(datetime)",
"content":[".storyBody"],
"exclude":[".shortcodeGalleryWrapper"]
},
"jvns.ca":{
"title":".entry-title",
"author":"#wrap > header:nth-child(1) > hgroup:nth-child(1) > h1:nth-child(1) > a:nth-child(1)",
"authorlink":"#wrap > header:nth-child(1) > hgroup:nth-child(1) > h1:nth-child(1) > a:nth-child(1)::attr(href)",
"date":"p.meta:nth-child(3) > time:nth-child(1)::attr(datetime)",
"content":[".entry-content"],
"cleanup_command":"hxclean"
},
"www.jtolio.com":{
"title":".container > div:nth-child(2) > h2:nth-child(2)",
"author":".navbar-brand",
"authorlink":".navbar-brand::attr(href)",
"date":".font-smaller > i:nth-child(1)",
"content":[".container > div:nth-child(3)"],
"cleanup_command":"hxclean"
},
"opensourceforu.com":{
"title":"h1.entry-title",
"author":"div.td-post-author-name > a:nth-child(2)",
"authorlink":"div.td-post-author-name > a:nth-child(2)::attr(href)",
"date":"div.td-post-header > div.td-module-meta-info > span.td-post-date",
"content":[".td-post-content"],
"exclude":[".sharedaddy"]
},
"nicolasparada.netlify.com":{
"title":".container > article:nth-child(1) > h1:nth-child(1)",
"date":".post-dates > time:nth-child(1)",
"content":[".container > article:nth-child(1) > div:nth-child(3)"],
"cleanup_command":"hxclean"
},
"fedoramagazine.org":{
"title":".post-title",
"author":".author",
"authorlink": ".author::attr(href)",
"date":".post-meta-date > a:nth-child(1)",
"content":[".post-image","div.post-content:nth-child(1)"],
"exclude":[".wp-block-separator","div.sharedaddy"]
},
"kerneltalks.com":{
"title":".entry-title",
"author":"",
"date":".entry-time",
"content":[".entry-content"],
"exclude":[".share-filled",".wp-block-separator"]
},
"www.linux.com":{
"title":"h1.entry-title",
"author":".td-post-author-name > a:nth-child(2)",
"authorlink": ".td-post-author-name > a:nth-child(2)::attr(href)",
"date":".td-post-date",
"content":[".td-post-featured-image",".td-post-content"],
"cleanup_command":"tidy -q --force-output yes --drop-empty-elements no --drop-empty-paras no --indent no|pandoc -t html -f html"
},
"leebriggs.co.uk":{
"title":".post-title",
"author":".site-footer > p:nth-child(1) > a:nth-child(1)",
"authorlink":".site-footer > p:nth-child(1) > a:nth-child(1)::attr(href)",
"date":".post-meta > time:nth-child(5)::attr(datetime)",
"content":[".post-content"],
"exclude":[],
"cleanup_command":"hxclean"
},
"theartofmachinery.com":{
"title":".entry-title",
"author":"",
"authorlink":"",
"date":".published::attr(datetime)",
"content":[".entry-content"],
"exclude":[],
"cleanup_command":"hxclean"
},
"www.ostechnix.com":{
"title":".post-title",
"author":".fn > a:nth-child(1)",
"date":".published",
"content":[".image-container",".entry-inner"],
"exclude":[".after-post-box",".sharedaddy"]
},
"jao.io":{
"title":".post-title",
"author":"#postamble > center:nth-child(1) > a:nth-child(4)",
"authorlink":"#postamble > center:nth-child(1) > a:nth-child(4)::attr(href)",
"date":".post-date",
"content":["#content"],
"exclude":[".post-title",".post-date"],
"cleanup_command":"hxclean"
},
"www.debugpoint.com":{
"title":"h1.entry-title",
"author":"h3.auth-name > a:nth-child(2) > span:nth-child(1)",
"authorlink":"h3.auth-name > a.auth-url::attr(href)",
"date":"time.published",
"summary":".s-post-content > p:nth-child(5)",
"content":[".s-post-content"],
"exclude":[".s-post-content > p > strong:first-child", ".s-post-content > p:last-of-type", ".s-post-content > a:last-of-type", "#also-read"],
"cleanup_command":"tidy -q --force-output yes --drop-empty-elements no --drop-empty-paras no --indent no"
}
}