forked from chenqinghe/baidu-ai-go-sdk
-
Notifications
You must be signed in to change notification settings - Fork 0
/
ocr.go
126 lines (83 loc) · 3.92 KB
/
ocr.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
package ocr
import (
"encoding/base64"
"github.com/chenqinghe/baidu-ai-go-sdk"
"io"
"io/ioutil"
)
// Endpoint URLs for the general-purpose text recognition calls.
const (
	// OCR_GENERAL_BASIC_URL is the endpoint used by GeneralRecognizeBasic.
	OCR_GENERAL_BASIC_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/general_basic"

	// OCR_GENERAL_WITH_LOCATION_URL is the endpoint used by
	// GeneralRecognizeWithLocation.
	OCR_GENERAL_WITH_LOCATION_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/general"

	// OCR_GENERAL_ENHANCED_URL is the endpoint used by
	// GeneralRecognizeEnhanced.
	OCR_GENERAL_ENHANCED_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/general_enhanced"
)
// Endpoint URLs for the specialised recognition calls.
const (
	// OCR_WEBIMAGE_URL is the endpoint used by WebImageRecognize.
	OCR_WEBIMAGE_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/webimage"

	// OCR_IDCARD_URL is the endpoint used by IdcardRecognize.
	OCR_IDCARD_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/idcard"

	// OCR_BANKCARD_URL is the endpoint used by BankcardRecognize.
	OCR_BANKCARD_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/bankcard"

	// OCR_DRIVERLICENSE_URL is the endpoint used by DriverLicenseRecognize.
	OCR_DRIVERLICENSE_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/driving_license"

	// OCR_VEHICLELICENSE_URL is the endpoint used by VehicleLicenseRecognize.
	OCR_VEHICLELICENSE_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/vehicle_license"

	// OCR_LICENSEPLATE_URL is the endpoint used by LicensePlateRecognize.
	OCR_LICENSEPLATE_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/license_plate"

	// OCR_FORM_URL is the endpoint used by FromdataRecognize. Unlike the
	// others it lives under solution/v1 rather than ocr/v1.
	OCR_FORM_URL = "https://aip.baidubce.com/rest/2.0/solution/v1/form_ocr/request"
)
// OCRClient is the entry point for the OCR calls in this package. It embeds
// *gosdk.Client, so that client's exported fields and methods are promoted
// onto OCRClient.
type OCRClient struct {
	*gosdk.Client
}
// NewOCRClient returns an OCRClient whose embedded client is created by
// gosdk.NewClient from the given apiKey and secretKey.
func NewOCRClient(apiKey, secretKey string) *OCRClient {
	client := new(OCRClient)
	client.Client = gosdk.NewClient(apiKey, secretKey)
	return client
}
// GeneralRecognizeBasic performs general text recognition.
//
// imageReader supplies the binary image data and params are optional request
// parameters. The call is forwarded to oc.ocr with OCR_GENERAL_BASIC_URL and
// defaultGeneralBasicParams; whatever oc.ocr returns is returned unchanged.
func (oc *OCRClient) GeneralRecognizeBasic(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_GENERAL_BASIC_URL, defaultGeneralBasicParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// GeneralRecognizeWithLocation performs general text recognition that
// includes location information.
//
// The call is forwarded to oc.ocr with OCR_GENERAL_WITH_LOCATION_URL and
// defaultGeneralWithLocationParams; whatever oc.ocr returns is returned
// unchanged.
func (oc *OCRClient) GeneralRecognizeWithLocation(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_GENERAL_WITH_LOCATION_URL, defaultGeneralWithLocationParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// GeneralRecognizeEnhanced performs general text recognition that also covers
// rare characters.
//
// The call is forwarded to oc.ocr with OCR_GENERAL_ENHANCED_URL and
// defaultDeneralEnhancedParams; whatever oc.ocr returns is returned unchanged.
// NOTE(review): "Deneral" in the defaults variable looks like a misspelling of
// "General"; the variable is declared outside this file, so it is used as is.
func (oc *OCRClient) GeneralRecognizeEnhanced(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_GENERAL_ENHANCED_URL, defaultDeneralEnhancedParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// WebImageRecognize submits the image read from imageReader to the webimage
// endpoint (OCR_WEBIMAGE_URL), starting from defaultWebimgParams and the
// optional params. Whatever oc.ocr returns is returned unchanged.
func (oc *OCRClient) WebImageRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_WEBIMAGE_URL, defaultWebimgParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// IdcardRecognize submits the image read from imageReader to the idcard
// endpoint (OCR_IDCARD_URL), starting from defaultIdcardParams and the
// optional params. Whatever oc.ocr returns is returned unchanged.
func (oc *OCRClient) IdcardRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_IDCARD_URL, defaultIdcardParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// BankcardRecognize submits the image read from imageReader to the bankcard
// endpoint (OCR_BANKCARD_URL), starting from defaultBankcardParams and the
// optional params. Whatever oc.ocr returns is returned unchanged.
func (oc *OCRClient) BankcardRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_BANKCARD_URL, defaultBankcardParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// DriverLicenseRecognize submits the image read from imageReader to the
// driving_license endpoint (OCR_DRIVERLICENSE_URL), starting from
// defaultDriverLicenseParams and the optional params. Whatever oc.ocr returns
// is returned unchanged.
func (oc *OCRClient) DriverLicenseRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_DRIVERLICENSE_URL, defaultDriverLicenseParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// VehicleLicenseRecognize submits the image read from imageReader to the
// vehicle_license endpoint (OCR_VEHICLELICENSE_URL), starting from
// defaultVehicleLicenseParams and the optional params. Whatever oc.ocr returns
// is returned unchanged.
func (oc *OCRClient) VehicleLicenseRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_VEHICLELICENSE_URL, defaultVehicleLicenseParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// LicensePlateRecognize submits the image read from imageReader to the
// license_plate endpoint (OCR_LICENSEPLATE_URL), starting from
// defaultLicensePlateParams and the optional params. Whatever oc.ocr returns
// is returned unchanged.
func (oc *OCRClient) LicensePlateRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_LICENSEPLATE_URL, defaultLicensePlateParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// FromdataRecognize submits the image read from imageReader to the form_ocr
// request endpoint (OCR_FORM_URL), starting from defaultFormParams and the
// optional params. Whatever oc.ocr returns is returned unchanged.
// NOTE(review): the method name looks like a misspelling of "Formdata"; it is
// exported, so it is kept for compatibility.
func (oc *OCRClient) FromdataRecognize(imageReader io.Reader, params ...RequestParam) ([]byte, error) {
	endpoint, defaults := OCR_FORM_URL, defaultFormParams
	return oc.ocr(imageReader, endpoint, defaults, params...)
}
// ocr is the shared implementation behind the exported recognition methods.
//
// It asks parseRequestParam to build the request parameters from imageReader,
// the defaults in def and the optional params, then hands them to
// oc.doRequest together with url. A parameter-building failure is returned
// as is, without calling oc.doRequest.
func (oc *OCRClient) ocr(imageReader io.Reader, url string, def map[string]interface{}, params ...RequestParam) ([]byte, error) {
	payload, parseErr := parseRequestParam(imageReader, def, params...)
	if parseErr != nil {
		return nil, parseErr
	}

	return oc.doRequest(url, payload)
}
// parseRequestParam builds the parameter map for a single OCR request.
//
// It reads imageReader to EOF, base64-encodes the bytes with the standard
// encoding and stores the result under the "image" key. Each option in params
// is then applied in order, so options can override both the defaults and
// "image". A read failure is returned as is, with a nil map.
//
// def is treated as read-only. Callers in this file pass package-level default
// maps, so writing into def directly would leak one request's image and
// options into every later request and would race when two requests run
// concurrently. The returned map is therefore a fresh shallow copy of def
// that the caller owns. A nil def is accepted and behaves like an empty map.
// Nil entries in params are skipped.
func parseRequestParam(imageReader io.Reader, def map[string]interface{}, params ...RequestParam) (map[string]interface{}, error) {
	imageBytes, err := ioutil.ReadAll(imageReader)
	if err != nil {
		return nil, err
	}

	// +1 leaves room for "image" when the defaults do not already carry it.
	requestParams := make(map[string]interface{}, len(def)+1)
	for key, value := range def {
		requestParams[key] = value
	}
	requestParams["image"] = base64.StdEncoding.EncodeToString(imageBytes)

	for _, apply := range params {
		if apply == nil {
			continue
		}
		apply(requestParams)
	}
	return requestParams, nil
}