forked from tikv/pd
-
Notifications
You must be signed in to change notification settings - Fork 0
/
tso.go
204 lines (171 loc) · 5.78 KB
/
tso.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
// Copyright 2016 PingCAP, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// See the License for the specific language governing permissions and
// limitations under the License.
package server
import (
"path"
"sync/atomic"
"time"
"github.com/coreos/etcd/clientv3"
"github.com/pingcap/kvproto/pkg/pdpb"
"github.com/pkg/errors"
log "github.com/sirupsen/logrus"
)
const (
// update timestamp every updateTimestampStep.
updateTimestampStep = 50 * time.Millisecond
updateTimestampGuard = time.Millisecond
maxLogical = int64(1 << 18)
)
var (
zeroTime = time.Time{}
)
type atomicObject struct {
physical time.Time
logical int64
}
func (s *Server) getTimestampPath() string {
return path.Join(s.rootPath, "timestamp")
}
func (s *Server) loadTimestamp() (time.Time, error) {
data, err := getValue(s.client, s.getTimestampPath())
if err != nil {
return zeroTime, err
}
if len(data) == 0 {
return zeroTime, nil
}
return parseTimestamp(data)
}
// save timestamp, if lastTs is 0, we think the timestamp doesn't exist, so create it,
// otherwise, update it.
func (s *Server) saveTimestamp(ts time.Time) error {
data := uint64ToBytes(uint64(ts.UnixNano()))
key := s.getTimestampPath()
resp, err := s.leaderTxn().Then(clientv3.OpPut(key, string(data))).Commit()
if err != nil {
return errors.WithStack(err)
}
if !resp.Succeeded {
return errors.New("save timestamp failed, maybe we lost leader")
}
s.lastSavedTime = ts
return nil
}
func (s *Server) syncTimestamp() error {
tsoCounter.WithLabelValues("sync").Inc()
last, err := s.loadTimestamp()
if err != nil {
return err
}
next := time.Now()
// gofail: var fallBackSync bool
// if fallBackSync {
// next = next.Add(time.Hour)
// }
// If the current system time minus the saved etcd timestamp is less than `updateTimestampGuard`,
// the timestamp allocation will start from the saved etcd timestamp temporarily.
if subTimeByWallClock(next, last) < updateTimestampGuard {
log.Errorf("system time may be incorrect: last: %v next %v", last, next)
next = last.Add(updateTimestampGuard)
}
save := next.Add(s.cfg.TsoSaveInterval.Duration)
if err = s.saveTimestamp(save); err != nil {
return err
}
tsoCounter.WithLabelValues("sync_ok").Inc()
log.Infof("sync and save timestamp: last %v save %v next %v", last, save, next)
current := &atomicObject{
physical: next,
}
s.ts.Store(current)
return nil
}
// This function will do two things:
// 1. When the logical time is going to be used up, the current physical time needs to increase.
// 2. If the time window is not enough, which means the saved etcd time minus the next physical time
// is less than or equal to `updateTimestampGuard`, it will need to be updated and save the
// next physical time plus `TsoSaveInterval` into etcd.
//
// Here is some constraints that this function must satisfy:
// 1. The physical time is monotonically increasing.
// 2. The saved time is monotonically increasing.
// 3. The physical time is always less than the saved timestamp.
func (s *Server) updateTimestamp() error {
prev := s.ts.Load().(*atomicObject)
now := time.Now()
// gofail: var fallBackUpdate bool
// if fallBackUpdate {
// now = now.Add(time.Hour)
// }
tsoCounter.WithLabelValues("save").Inc()
jetLag := subTimeByWallClock(now, prev.physical)
if jetLag > 3*updateTimestampStep {
log.Warnf("clock offset: %v, prev: %v, now: %v", jetLag, prev.physical, now)
tsoCounter.WithLabelValues("slow_save").Inc()
}
if jetLag < 0 {
tsoCounter.WithLabelValues("system_time_slow").Inc()
}
var next time.Time
prevLogical := atomic.LoadInt64(&prev.logical)
// If the system time is greater, it will be synchronized with the system time.
if jetLag > updateTimestampGuard {
next = now
} else if prevLogical > maxLogical/2 {
// The reason choosing maxLogical/2 here is that it's big enough for common cases.
// Because there is enough timestamp can be allocated before next update.
log.Warnf("the logical time may be not enough, prevLogical: %v", prevLogical)
next = prev.physical.Add(time.Millisecond)
} else {
// It will still use the previous physical time to alloc the timestamp.
tsoCounter.WithLabelValues("skip_save").Inc()
return nil
}
// It is not safe to increase the physical time to `next`.
// The time window needs to be updated and saved to etcd.
if subTimeByWallClock(s.lastSavedTime, next) <= updateTimestampGuard {
save := next.Add(s.cfg.TsoSaveInterval.Duration)
if err := s.saveTimestamp(save); err != nil {
return err
}
}
current := &atomicObject{
physical: next,
logical: 0,
}
s.ts.Store(current)
metadataGauge.WithLabelValues("tso").Set(float64(next.Unix()))
return nil
}
const maxRetryCount = 100
func (s *Server) getRespTS(count uint32) (pdpb.Timestamp, error) {
var resp pdpb.Timestamp
for i := 0; i < maxRetryCount; i++ {
current, ok := s.ts.Load().(*atomicObject)
if !ok || current.physical == zeroTime {
log.Errorf("we haven't synced timestamp ok, wait and retry, retry count %d", i)
time.Sleep(200 * time.Millisecond)
continue
}
resp.Physical = current.physical.UnixNano() / int64(time.Millisecond)
resp.Logical = atomic.AddInt64(¤t.logical, int64(count))
if resp.Logical >= maxLogical {
log.Errorf("logical part outside of max logical interval %v, please check ntp time, retry count %d", resp, i)
tsoCounter.WithLabelValues("logical_overflow").Inc()
time.Sleep(updateTimestampStep)
continue
}
return resp, nil
}
return resp, errors.New("can not get timestamp")
}