-
Notifications
You must be signed in to change notification settings - Fork 0
/
parser_5.py
45 lines (31 loc) · 1.02 KB
/
parser_5.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
import requests
import csv
# Parsing (AJAX)
def get_html(url, timeout=30):
    """Fetch *url* with an HTTP GET request and return the body as text.

    Args:
        url: Address to request.
        timeout: Seconds to wait for the server before giving up. Without
            a timeout ``requests`` may block indefinitely on a stalled
            connection.

    Returns:
        The decoded response body (``Response.text``).

    Raises:
        requests.RequestException: On connection failures, timeouts, or
            a 4xx/5xx HTTP status.
    """
    response = requests.get(url, timeout=timeout)
    # Fail loudly on an HTTP error instead of handing an error page to the
    # caller as if it were data.
    response.raise_for_status()
    return response.text
def write_csv(data, path='websites.csv'):
    """Append one record to a CSV file.

    Args:
        data: Mapping with the keys ``name``, ``url``, ``description``,
            ``traffic`` and ``percent``. Columns are written in that order.
        path: Destination file; defaults to ``websites.csv`` in the
            current working directory. The file is created if missing.

    Raises:
        ValueError: If *data* contains a key that is not one of the
            declared field names (``csv.DictWriter`` default behaviour).
    """
    order = ['name', 'url', 'description', 'traffic', 'percent']
    # newline='' lets the csv module control line endings itself; without
    # it every row is followed by a blank line on Windows.
    # An explicit UTF-8 encoding keeps non-ASCII text from depending on the
    # platform's locale codec.
    with open(path, 'a', newline='', encoding='utf-8') as f:
        writer = csv.DictWriter(f, fieldnames=order)
        writer.writerow(data)
def main(page_count=6428):
    """Download rating pages as TSV and append every site row to the CSV.

    Pages ``0 .. page_count - 1`` are requested one after another. For each
    page the first line is dropped (presumably a header or summary line;
    verify against the live response) and every remaining tab-separated
    line is written out through ``write_csv``.

    Args:
        page_count: Number of pages to request, starting from page 0.
    """
    fields = ('name', 'url', 'description', 'traffic', 'percent')
    for page in range(page_count):
        page_url = 'https://www.liveinternet.ru/rating/ru//today.tsv?page={}'.format(page)
        response = get_html(page_url)
        rows = response.strip().split('\n')[1:]
        for row in rows:
            columns = row.strip().split('\t')
            # Blank or truncated lines would otherwise raise IndexError and
            # abort the whole run; skip them instead.
            if len(columns) < len(fields):
                continue
            # zip stops at the five declared fields, so extra trailing
            # columns are ignored, matching the original positional reads.
            record = dict(zip(fields, columns))
            write_csv(record)
# Run the scraper only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == "__main__":
    main()