/
transform.go
54 lines (47 loc) · 1.61 KB
/
transform.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
/*
* go-leia
* Copyright (C) 2021 Nuts community
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*
*/
package leia
import (
"regexp"
"strings"
)
// Transform is a function definition for transforming values and search terms.
// It accepts an arbitrary value and returns the transformed value; ToLower is
// an example of a function with this signature.
type Transform func(interface{}) interface{}
// ToLower returns the lower-cased form of terms, with all Unicode letters
// mapped to their lower case.
//
// Only string, Key and []byte values are transformed, and the result for each
// of them is a string; a Key is converted through its String method first.
// Any other value is returned unchanged.
func ToLower(terms interface{}) interface{} {
	// Bind the asserted value once instead of re-asserting it in every case.
	switch v := terms.(type) {
	case string:
		return strings.ToLower(v)
	case Key:
		return strings.ToLower(v.String())
	case []byte:
		return strings.ToLower(string(v))
	default:
		return terms
	}
}
// Tokenizer is a function definition that transforms a text into tokens.
// It takes the text as a single string and returns the tokens as a slice of
// strings; WhiteSpaceTokenizer is an example of a function with this signature.
type Tokenizer func(string) []string
// nonWhitespaceRegex matches a run of one or more non-whitespace characters.
const nonWhitespaceRegex = `\S+`

// nonWhitespaceExp is nonWhitespaceRegex compiled once at package
// initialisation, so WhiteSpaceTokenizer does not recompile the pattern (and
// discard the compile error) on every call.
var nonWhitespaceExp = regexp.MustCompile(nonWhitespaceRegex)

// WhiteSpaceTokenizer splits text into tokens, where every token is a match of
// the `\S+` pattern: a maximal run of non-whitespace characters.
// The tokens are returned in order of appearance. The result is nil when text
// contains no non-whitespace characters.
func WhiteSpaceTokenizer(text string) []string {
	return nonWhitespaceExp.FindAllString(text, -1)
}