forked from iawia002/lux
/
douyin.go
90 lines (77 loc) · 1.79 KB
/
douyin.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
package douyin
import (
"encoding/json"
"errors"
"fmt"
"github.com/maseer/annie/extractors/types"
"github.com/maseer/annie/request"
"github.com/maseer/annie/utils"
)
// awemeItem is one entry of the "item_list" array in the item-info API
// response. Only the description field is decoded.
type awemeItem struct {
	Desc string `json:"desc"`
}

// data is the subset of the item-info API response that this package reads.
type data struct {
	ItemList []awemeItem `json:"item_list"`
}
// extractor is the stateless receiver for this package's Extract method; New
// hands it out as a types.Extractor.
type extractor struct{}
// New returns a new Douyin extractor as a types.Extractor.
func New() types.Extractor {
	return new(extractor)
}
// Extract is the main function to extract the data.
//
// It fetches the page at url, reads the direct video address from the page's
// `playAddr` field, and then queries the item-info web API (using the numeric
// video ID taken from url and the `dytk` token taken from the page) to obtain
// the video description, which is used as the title.
//
// On success it returns a single-element slice describing the video with one
// "default" mp4 stream. It returns an error when a request fails, when the
// play address, video ID or dytk token cannot be found, or when the API
// response cannot be decoded or contains no items. The option argument is
// currently not consulted.
func (e *extractor) Extract(url string, option types.Options) ([]*types.Data, error) {
	html, err := request.Get(url, url, nil)
	if err != nil {
		return nil, err
	}

	// The captured value is read from index 1, so every match result must
	// hold at least two elements before it is indexed.
	realURLs := utils.MatchOneOf(html, `playAddr: "(.+?)"`)
	if len(realURLs) < 2 {
		return nil, types.ErrURLParseFailed
	}
	realURL := realURLs[1]

	size, err := request.Size(realURL, url)
	if err != nil {
		return nil, err
	}
	urlData := &types.Part{
		URL:  realURL,
		Size: size,
		Ext:  "mp4",
	}
	streams := map[string]*types.Stream{
		"default": {
			Parts: []*types.Part{urlData},
			Size:  size,
		},
	}

	videoIDs := utils.MatchOneOf(url, `/video/(\d+)`)
	if len(videoIDs) < 2 {
		return nil, errors.New("unable to get video ID")
	}
	videoID := videoIDs[1]

	dytks := utils.MatchOneOf(html, `dytk: "(.+?)"`)
	if len(dytks) < 2 {
		return nil, errors.New("unable to get dytk info")
	}
	dytk := dytks[1]

	apiDataString, err := request.Get(
		fmt.Sprintf("https://www.douyin.com/web/api/v2/aweme/iteminfo/?item_ids=%s&dytk=%s", videoID, dytk),
		url, nil,
	)
	if err != nil {
		return nil, err
	}

	var apiData data
	if err := json.Unmarshal([]byte(apiDataString), &apiData); err != nil {
		return nil, err
	}
	// A well-formed response may still carry an empty or missing item_list
	// (for example for a removed video); report it instead of panicking on
	// the index below.
	if len(apiData.ItemList) == 0 {
		return nil, errors.New("unable to get video title: item list is empty")
	}

	return []*types.Data{
		{
			Site:    "抖音 douyin.com",
			Title:   apiData.ItemList[0].Desc,
			Type:    types.DataTypeVideo,
			Streams: streams,
			URL:     url,
		},
	}, nil
}