-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathAttention.go
executable file
·129 lines (109 loc) · 2.52 KB
/
Attention.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
package layer
import tf "github.com/galeone/tensorflow/tensorflow/go"
// LAttention holds the settings and graph wiring for an Attention layer.
// Values are assigned through the chained Set* methods and exported by
// GetKerasLayerConfig.
type LAttention struct {
	// causal is exported under the "causal" config key.
	causal bool
	// dropout is exported under the "dropout" config key.
	dropout float64
	// dtype is exported (through its String method) under the "dtype" config key.
	dtype DataType
	// inputs are the layers whose names populate the inbound nodes of the config.
	inputs []Layer
	// name is exported both as the layer name and under the "name" config key.
	name string
	// shape is stored by SetShape and returned by GetShape.
	shape tf.Shape
	// trainable is exported under the "trainable" config key.
	trainable bool
	// useScale is exported under the "use_scale" config key.
	useScale bool
	// layerWeights is stored by SetLayerWeights and returned by GetLayerWeights.
	layerWeights []*tf.Tensor
}
// Attention returns a new LAttention populated with its defaults: a unique
// name derived from "attention", dtype Float32, trainable enabled, and
// causal, dropout and useScale left off/zero.
func Attention() *LAttention {
	layer := new(LAttention)
	layer.causal = false
	layer.dropout = 0
	layer.dtype = Float32
	layer.name = UniqueName("attention")
	layer.trainable = true
	layer.useScale = false
	return layer
}
// SetCausal stores the causal flag and returns the receiver so calls can be
// chained.
func (l *LAttention) SetCausal(causal bool) *LAttention {
	l.causal = causal
	return l
}
// SetDropout stores the dropout value and returns the receiver so calls can
// be chained. The value is stored as given; no range check is applied here.
func (l *LAttention) SetDropout(dropout float64) *LAttention {
	l.dropout = dropout
	return l
}
// SetDtype stores the layer's data type and returns the receiver so calls
// can be chained.
func (l *LAttention) SetDtype(dtype DataType) *LAttention {
	l.dtype = dtype
	return l
}
// SetName replaces the layer's name and returns the receiver so calls can be
// chained.
func (l *LAttention) SetName(name string) *LAttention {
	l.name = name
	return l
}
// SetShape stores the given shape and returns the receiver so calls can be
// chained.
func (l *LAttention) SetShape(shape tf.Shape) *LAttention {
	l.shape = shape
	return l
}
// SetTrainable stores the trainable flag and returns the receiver so calls
// can be chained.
func (l *LAttention) SetTrainable(trainable bool) *LAttention {
	l.trainable = trainable
	return l
}
// SetUseScale stores the useScale flag and returns the receiver so calls can
// be chained.
func (l *LAttention) SetUseScale(useScale bool) *LAttention {
	l.useScale = useScale
	return l
}
// SetLayerWeights stores the given weight tensors and returns the receiver so
// calls can be chained. The slice is kept as passed; it is not copied.
func (l *LAttention) SetLayerWeights(layerWeights []*tf.Tensor) *LAttention {
	l.layerWeights = layerWeights
	return l
}
// GetShape returns the shape previously stored with SetShape.
func (l *LAttention) GetShape() tf.Shape {
	return l.shape
}
// GetDtype returns the layer's data type.
func (l *LAttention) GetDtype() DataType {
	return l.dtype
}
// SetInputs replaces the layer's inputs with the given layers and returns the
// receiver as a Layer. The variadic slice is kept as passed; it is not copied.
func (l *LAttention) SetInputs(inputs ...Layer) Layer {
	l.inputs = inputs
	return l
}
// GetInputs returns the layers previously stored with SetInputs.
func (l *LAttention) GetInputs() []Layer {
	return l.inputs
}
// GetName returns the layer's name.
func (l *LAttention) GetName() string {
	return l.name
}
// GetLayerWeights returns the weight tensors previously stored with
// SetLayerWeights.
func (l *LAttention) GetLayerWeights() []*tf.Tensor {
	return l.layerWeights
}
// jsonConfigLAttention is the JSON-serialisable description of an Attention
// layer returned by GetKerasLayerConfig.
type jsonConfigLAttention struct {
	// ClassName is encoded as "class_name".
	ClassName string `json:"class_name"`
	// Name is encoded as "name".
	Name string `json:"name"`
	// Config carries the layer settings and is encoded as "config".
	Config map[string]interface{} `json:"config"`
	// InboundNodes lists the incoming connections and is encoded as
	// "inbound_nodes".
	InboundNodes [][][]interface{} `json:"inbound_nodes"`
}
// GetKerasLayerConfig builds the jsonConfigLAttention value describing this
// layer: class name "Attention", the layer name, its settings, and one inbound
// node entry per input layer.
func (l *LAttention) GetKerasLayerConfig() interface{} {
	// Each input contributes [name, 0, 0, {}]. The list is allocated non-nil
	// so that a layer without inputs still yields an empty list, not a nil one.
	nodes := make([][]interface{}, 0, len(l.inputs))
	for i := range l.inputs {
		entry := []interface{}{
			l.inputs[i].GetName(),
			0,
			0,
			map[string]bool{},
		}
		nodes = append(nodes, entry)
	}

	settings := map[string]interface{}{
		"causal":    l.causal,
		"dropout":   l.dropout,
		"dtype":     l.dtype.String(),
		"name":      l.name,
		"trainable": l.trainable,
		"use_scale": l.useScale,
	}

	return jsonConfigLAttention{
		ClassName:    "Attention",
		Name:         l.name,
		Config:       settings,
		InboundNodes: [][][]interface{}{nodes},
	}
}
// GetCustomLayerDefinition returns the custom layer definition for this
// layer, which is always the empty string.
func (l *LAttention) GetCustomLayerDefinition() string {
	return ""
}