-
Notifications
You must be signed in to change notification settings - Fork 0
/
tmpfile
119 lines (96 loc) · 2.03 KB
/
tmpfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
package main
import (
"fmt"
"io"
"io/ioutil"
"net/http"
"os"
"regexp"
"strconv"
"strings"
"time"
)
var (
// regHref is a regular-expression pattern held as a plain string; nothing in
// the visible code compiles or uses it. As written it matches the scheme
// "http", "https", "ftp" or "ftps", then "://", up to three 'w' characters,
// any single character, "baidu", any single character, "com/link?", and a
// run of characters from the trailing class.
// NOTE(review): the dots are unescaped, so they match any character rather
// than a literal '.', and the range `A-z` also admits the ASCII punctuation
// that sits between 'Z' and 'a' — confirm whether `A-Z` was intended.
regHref = `((ht|f)tps?)://[w]{0,3}.baidu.com/link\?[a-zA-z=0-9-\s]*`
)package main
import (
"fmt"
"io/ioutil"
"net/http"
"os"
"regexp"
"time"
"strings"
)
// urls accumulates the "/address/..." paths that fistStart collects from the
// verified-contracts listing page.
var urls = []string{}

// sourceCode accumulates the source snippets that getSource extracts from
// each fetched page.
var sourceCode = []string{}
// main runs the scraper end to end: it collects the address paths, fetches
// the page behind each one, and finally prints every extracted snippet.
func main() {
	// Host that every collected "/address/..." path is appended to.
	const base = "http://etherscan.io"

	fistStart()

	for idx := range urls {
		getSource(base + urls[idx])
	}

	for idx := range sourceCode {
		fmt.Println("ETH sourceCode:")
		fmt.Println(sourceCode[idx])
	}
}
// sourceCodePattern matches one source snippet together with the literal
// markup that surrounds it on the page. (?s:...) lets the lazy capture span
// multiple lines. Compiled once at package scope instead of on every call.
var sourceCodePattern = regexp.MustCompile(`top: 5px;'>(?s:(.*?))</pre><br><script>`)

// getSource downloads the page at url, extracts every snippet matched by
// sourceCodePattern, strips the surrounding markup from each match, and
// appends the results to the package-level sourceCode slice.
//
// Failures to fetch or read the page are printed and the page is skipped;
// nothing is appended in that case.
func getSource(url string) {
	fmt.Println("Geting ", url, "SourceCode")

	resp, err := http.Get(url)
	if err != nil {
		fmt.Println(err)
		return
	}
	defer resp.Body.Close()

	body, err := ioutil.ReadAll(resp.Body)
	if err != nil {
		fmt.Println(err)
		return
	}

	// Literal markers that delimit each match of sourceCodePattern.
	const (
		openMarker  = "top: 5px;'>"
		closeMarker = "</pre><br><script>"
	)

	snippets := sourceCodePattern.FindAllString(string(body), -1)
	for i, s := range snippets {
		// TrimPrefix/TrimSuffix remove exactly the marker text. The cutset-based
		// TrimLeft/TrimRight would also strip any leading or trailing snippet
		// characters that happen to appear in the markers (e.g. 'p', 't', ';').
		s = strings.TrimPrefix(s, openMarker)
		snippets[i] = strings.TrimSuffix(s, closeMarker)
	}

	sourceCode = append(sourceCode, snippets...)
}
// fistStart downloads the verified-contracts listing page, prints the raw
// page, and appends every "/address/..." match found in it to the
// package-level urls slice. It finishes by printing the number of collected
// entries.
//
// If the page cannot be fetched or read, the error is printed and the
// function returns without collecting anything.
func fistStart() {
	url := "http://etherscan.io/contractsVerified"

	// The error must be checked before resp is touched: on failure resp is nil
	// and the deferred Close would panic.
	resp, err := http.Get(url)
	if err != nil {
		fmt.Println(err)
		return
	}
	defer resp.Body.Close()

	body, err := ioutil.ReadAll(resp.Body)
	if err != nil {
		fmt.Println(err)
		return
	}
	page := string(body)
	fmt.Println(page)

	// NOTE(review): the class range `A-z` also admits the ASCII punctuation
	// between 'Z' and 'a', and `\s` lets a match run on into trailing
	// whitespace. The pattern is kept unchanged; confirm whether `A-Z` was
	// intended.
	reg := regexp.MustCompile(`/address/[a-zA-z=0-9-\s]*`)
	for _, d := range reg.FindAllString(page, -1) {
		fmt.Println("地址收集: ", d)
		urls = append(urls, d)
	}
	fmt.Println("\n首次收集网络地址:", len(urls))
}
// checkRegexp compiles reg and applies it to cont; style selects the form of
// the result:
//
//	0       the first match, as a string ("" when there is none)
//	1       every match, as a []string
//	other   every match, as a [][]byte
//
// reg is compiled with regexp.MustCompile, so an invalid pattern panics.
func checkRegexp(cont string, reg string, style int) (result interface{}) {
	pattern := regexp.MustCompile(reg)

	if style == 0 {
		return pattern.FindString(cont)
	}
	if style == 1 {
		return pattern.FindAllString(cont, -1)
	}
	return pattern.FindAll([]byte(cont), -1)
}
// Timer prints the crawl banner once per second, forever. It never returns,
// so callers that need to keep running must start it in its own goroutine.
//
// The wait-and-print cycle is a loop rather than a self-call: Go does not
// eliminate tail calls, so recursing here would add a stack frame every
// second for as long as the program runs.
func Timer() {
	for {
		time.Sleep(time.Second * 1)
		fmt.Print("\n\n\n执行爬抓\n\n")
	}
}
// checkFile looks for an entry named file among the direct children of dir
// and returns its os.FileInfo.
//
// It returns nil when dir cannot be read or contains no entries. When dir has
// entries but none is named file, the first entry is returned (ioutil.ReadDir
// sorts entries by filename).
func checkFile(dir string, file string) os.FileInfo {
	list, err := ioutil.ReadDir(dir)
	if err != nil || len(list) == 0 {
		// Nothing to return; indexing list[0] here would panic.
		return nil
	}

	for _, info := range list {
		if info.Name() == file {
			return info
		}
	}

	// NOTE(review): falling back to an unrelated first entry when file is
	// missing is preserved for backward compatibility; confirm whether callers
	// rely on it or whether nil would be the better "not found" result.
	return list[0]
}