forked from abadojack/swot
-
Notifications
You must be signed in to change notification settings - Fork 1
/
swot.go
126 lines (106 loc) · 2.52 KB
/
swot.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
// Package swot identifies email addresses and URLs that belong to academic institutions.
//go:generate broccoli -src domains
package swot
import (
"errors"
"io/ioutil"
"net/url"
"path/filepath"
"strings"
valid "github.com/asaskevich/govalidator"
)
var (
// ErrDomainNotFound is returned by parseDomain when the given address is
// neither a valid email address nor a valid URL, so no domain can be
// extracted from it.
ErrDomainNotFound = errors.New("Domain name not found")
// ErrSchoolNotFound is returned by getInstitutionName when no institution
// file exists for any suffix of the domain.
ErrSchoolNotFound = errors.New("School name not found")
)
// isBlacklisted reports whether domain ends with any entry of the
// package-level blacklist.
//
// NOTE(review): the comparison is a plain string-suffix match with no
// label-boundary check, so whether "xsi.edu" matches an entry "si.edu"
// depends on how the blacklist entries are written — confirm against the
// blacklist definition.
func isBlacklisted(domain string) bool {
	matched := false
	for _, suffix := range blacklist {
		if strings.HasSuffix(domain, suffix) {
			matched = true
			break
		}
	}
	return matched
}
// isAcademicTLD reports whether domain ends with any entry of the
// package-level tlds list. The check is a plain string-suffix comparison.
func isAcademicTLD(domain string) bool {
	for _, suffix := range tlds {
		if !strings.HasSuffix(domain, suffix) {
			continue
		}
		return true
	}
	return false
}
// parseDomain extracts the host/domain part from an email address or URL.
//
// The address is trimmed and lower-cased first. It returns:
//   - for an email address, everything after the last '@';
//   - for a URL with a scheme ("scheme://..."), the URL's host name without
//     port or IPv6 brackets;
//   - for a URL without a scheme (e.g. "mit.edu", "mit.edu:8080",
//     "mit.edu/about"), the host name with any port and path removed;
//   - ErrDomainNotFound when the address is neither an email nor a URL.
//
// An error from url.Parse is returned unchanged for scheme-qualified URLs.
func parseDomain(address string) (string, error) {
	address = strings.ToLower(strings.TrimSpace(address))

	switch {
	case valid.IsEmail(address):
		// Cut at the LAST '@': a domain can never contain '@', whereas a
		// quoted local part may (assuming the validator accepts quoted
		// local parts — TODO confirm).
		return address[strings.LastIndex(address, "@")+1:], nil

	case valid.IsURL(address):
		if strings.Contains(address, "://") {
			if valid.IsRequestURL(address) {
				u, err := url.Parse(address)
				if err != nil {
					return "", err
				}
				// Hostname strips the port and handles bracketed IPv6
				// literals, which splitting Host on ':' does not.
				return u.Hostname(), nil
			}
			return address, nil
		}

		// No scheme: parse as a scheme-relative reference so that the host
		// is separated from an optional port and path.
		if u, err := url.Parse("//" + address); err == nil {
			if host := u.Hostname(); host != "" {
				return host, nil
			}
		}
		// Fall back to the raw address when it cannot be parsed this way.
		return address, nil
	}

	return "", ErrDomainNotFound
}
// fileExists reports whether br.Stat succeeds for path. Any Stat error is
// treated as "does not exist".
func fileExists(path string) bool {
	_, err := br.Stat(path)
	return err == nil
}
// getInstitutionName returns the raw contents of the institution file that
// matches the domain of address.
//
// The domain is obtained with parseDomain and split into labels. Starting
// from the last label, each label is appended to the path "domains" and the
// resulting "<path>.txt" is probed, so "cs.mit.edu" probes domains/edu.txt,
// then domains/edu/mit.txt, then domains/edu/mit/cs.txt. The first file that
// exists is read in full and returned without trimming.
//
// It returns the parseDomain error if the address cannot be parsed, any
// error from opening or reading the file, and ErrSchoolNotFound when no
// file matches.
func getInstitutionName(address string) (string, error) {
	domain, err := parseDomain(address)
	if err != nil {
		return "", err
	}

	labels := splitdomain(domain)
	path := "domains"
	for i := len(labels) - 1; i >= 0; i-- {
		path = filepath.Join(path, labels[i])
		name := path + ".txt"
		if !fileExists(name) {
			continue
		}

		f, err := br.Open(name)
		if err != nil {
			return "", err
		}
		// Release the opened file on every exit path; the function returns
		// right after reading, so the defer fires immediately.
		defer f.Close()

		b, err := ioutil.ReadAll(f)
		if err != nil {
			return "", err
		}
		return string(b), nil
	}
	return "", ErrSchoolNotFound
}
// splitdomain breaks domain into its dot-separated labels, in order.
// Empty labels are kept, so "" yields a single empty label.
func splitdomain(domain string) []string {
	const sep = "."
	labels := strings.Split(domain, sep)
	return labels
}
// IsAcademic reports whether the given email address or URL belongs to an
// academic institution.
//
// It returns false when no domain can be parsed from address or when the
// domain is blacklisted. Otherwise it returns true if the domain has an
// academic TLD or if an institution name can be looked up for it.
func IsAcademic(address string) bool {
	domain, err := parseDomain(address)
	switch {
	case err != nil:
		return false
	case isBlacklisted(domain):
		// The blacklist takes precedence over the TLD check.
		return false
	case isAcademicTLD(domain):
		return true
	}

	if _, err := getInstitutionName(domain); err != nil {
		return false
	}
	return true
}
// GetSchoolName returns the name of the academic institution that the given
// email address or URL belongs to, with surrounding whitespace removed.
// It returns an empty string when the lookup fails for any reason.
func GetSchoolName(address string) string {
	if name, err := getInstitutionName(address); err == nil {
		return strings.TrimSpace(name)
	}
	return ""
}