-
Notifications
You must be signed in to change notification settings - Fork 0
/
pics.go
87 lines (77 loc) · 1.84 KB
/
pics.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
package extractor
import (
"io"
"net/http"
"sort"
"sync"
"time"
"github.com/PuerkitoBio/goquery"
log "github.com/go-pkgz/lgr"
)
func (f UReadability) extractPics(iselect *goquery.Selection, url string) (mainImage string, allImages []string, ok bool) {
images := make(map[int]string)
type imgInfo struct {
url string
size int
}
var resCh = make(chan imgInfo)
var wg sync.WaitGroup
iselect.Each(func(_ int, s *goquery.Selection) {
if im, ok := s.Attr("src"); ok {
wg.Add(1)
go func(url string) {
size := f.getImageSize(url)
resCh <- imgInfo{url: url, size: size}
wg.Done()
}(im)
}
})
go func() {
wg.Wait()
close(resCh)
}()
for r := range resCh {
images[r.size] = r.url
allImages = append(allImages, r.url)
}
sort.Strings(allImages)
if len(images) == 0 {
return "", nil, false
}
// get the biggest picture
keys := make([]int, 0, len(images))
for k := range images {
keys = append(keys, k)
}
sort.Sort(sort.Reverse(sort.IntSlice(keys)))
mainImage = images[keys[0]]
log.Printf("[DEBUG] total images from %s = %d, main=%s (%d)", url, len(images), mainImage, keys[0])
return mainImage, allImages, true
}
// getImageSize loads image to get size
func (f UReadability) getImageSize(url string) (size int) {
httpClient := &http.Client{Timeout: time.Second * 30}
req, err := http.NewRequest("GET", url, nil)
if err != nil {
log.Printf("[WARN] can't create request to get pic from %s", url)
return 0
}
req.Close = true
req.Header.Set("User-Agent", userAgent)
resp, err := httpClient.Do(req)
if err != nil {
log.Printf("[WARN] can't get %s, error=%v", url, err)
return 0
}
defer func() {
if err = resp.Body.Close(); err != nil {
size = 0
}
}()
data, err := io.ReadAll(resp.Body)
if err != nil {
log.Printf("[WARN] failed to get %s, err=%v", url, err)
return 0
}
return len(data)
}