/
maoyan.js
70 lines (57 loc) · 1.55 KB
/
maoyan.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
const Axios = require('axios')
const fs = require('fs')
const path = require('path')
const GROUP_END = 10
async function getOnePage(url) {
try {
let headers = {
'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_3) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.162 Safari/537.36'
}
let response = await Axios.get(url, { headers })
if(response.status === 200) {
return response.data
}
return
} catch (error) {
return
}
}
function parseOnePage(html) {
let re = /<dd>(?:\s.*?)*board-index.*?>(\d+)<\/i>(?:\s.*?)*data-src="(.*?)"(?:\s.*?)*name"><a.*?>(.*?)<\/a><\/p>\s*?<p class="star">\s*?(.*?)\s*?<\/p>(?:\s.*?)*releasetime">(.*?)<\/p>(?:\s.*?)*integer">(.*?)<\/i>.*?fraction">(.*?)<\/i>/g
let arr = []
let item
while (item = re.exec(html)) {
item.splice(0 ,1)
arr.push({
'index': item[0],
'image': item[1],
'title': item[2],
'actor': item[3],
'time': item[4],
'score': item[5] + item[6]
})
}
return arr
}
async function writeToFile(content) {
return new Promise((response, reject) => {
fs.appendFile('./MaoYan/result.txt', JSON.stringify(content) + '\n', (err) => {
if(err) return reject()
response()
})
})
}
async function main(offset) {
let url = `http://maoyan.com/board/4?offset=${offset}`
let html = await getOnePage(url)
for(let item of parseOnePage(html)) {
await writeToFile(item)
}
}
let groups = []
for(let i = 0; i < GROUP_END; i++){
groups.push(i*10)
}
groups.forEach(offset => {
main(offset)
})