-
Notifications
You must be signed in to change notification settings - Fork 0
/
text.go
97 lines (83 loc) · 2.01 KB
/
text.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
package utils
import (
"bytes"
"encoding/json"
"golang.org/x/text/unicode/norm"
"io"
"regexp"
"strings"
)
func Normalize(s string) string {
return norm.NFKC.String(s)
}
func JSONEncoder(w io.Writer) *json.Encoder {
enc := json.NewEncoder(w)
enc.SetEscapeHTML(false)
return enc
}
func JSONMarshal(v interface{}) ([]byte, error) {
var b bytes.Buffer
err := JSONEncoder(&b).Encode(v)
return b.Bytes(), err
}
func JSONString(v interface{}) string {
var s strings.Builder
enc := JSONEncoder(&s)
enc.SetIndent("", " ")
_ = enc.Encode(v)
return s.String()
}
func Snake(s string) string {
s = addWordBoundariesToNumbers(s)
s = strings.Trim(s, " ")
n := ""
for i, v := range s {
// treat acronyms as words, eg for JSONData -> JSON is a whole word
nextCaseIsChanged := false
if i+1 < len(s) {
next := s[i+1]
if (v >= 'A' && v <= 'Z' && next >= 'a' && next <= 'z') || (v >= 'a' && v <= 'z' && next >= 'A' && next <= 'Z') {
nextCaseIsChanged = true
}
}
if i > 0 && n[len(n)-1] != '_' && nextCaseIsChanged {
// add underscore if next letter case type is changed
if v >= 'A' && v <= 'Z' {
n += "_" + string(v)
} else if v >= 'a' && v <= 'z' {
n += string(v) + "_"
}
} else if v == ' ' || v == '_' || v == '-' {
// replace spaces/underscores with delimiters
n += "_"
} else {
n = n + string(v)
}
}
return strings.ToLower(n)
}
var numberSequence = regexp.MustCompile(`([a-zA-Z])(\d+)([a-zA-Z]?)`)
var numberReplacement = []byte(`$1 $2 $3`)
func addWordBoundariesToNumbers(s string) string {
b := []byte(s)
b = numberSequence.ReplaceAll(b, numberReplacement)
return string(b)
}
var nullChar = byte(0)
var backspaceChar = byte(8)
var crChar = byte(13)
var subsChar = byte(26)
func isControlChar(ch byte) bool {
return (ch > nullChar && ch < backspaceChar) || (ch > crChar && ch < subsChar)
}
func IsBinary(content []byte) bool {
if len(content) >= 8000 {
content = content[:8000]
}
for _, c := range content {
if isControlChar(c) {
return true
}
}
return false
}