-
Notifications
You must be signed in to change notification settings - Fork 671
/
topological.go
645 lines (541 loc) · 20.1 KB
/
topological.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
// Copyright (C) 2019-2021, Ava Labs, Inc. All rights reserved.
// See the file LICENSE for licensing terms.
package snowman
import (
"errors"
"fmt"
"strings"
"go.uber.org/zap"
"github.com/ava-labs/avalanchego/ids"
"github.com/ava-labs/avalanchego/snow"
"github.com/ava-labs/avalanchego/snow/choices"
"github.com/ava-labs/avalanchego/snow/consensus/metrics"
"github.com/ava-labs/avalanchego/snow/consensus/snowball"
)
var (
errDuplicateAdd = errors.New("duplicate block add")
_ Factory = &TopologicalFactory{}
_ Consensus = &Topological{}
)
// TopologicalFactory implements Factory by returning a topological struct
type TopologicalFactory struct{}
func (TopologicalFactory) New() Consensus { return &Topological{} }
// Topological implements the Snowman interface by using a tree tracking the
// strongly preferred branch. This tree structure amortizes network polls to
// vote on more than just the next block.
type Topological struct {
metrics.Latency
metrics.Polls
metrics.Height
// pollNumber is the number of times RecordPolls has been called
pollNumber uint64
// ctx is the context this snowman instance is executing in
ctx *snow.ConsensusContext
// params are the parameters that should be used to initialize snowball
// instances
params snowball.Parameters
// head is the last accepted block
head ids.ID
// height is the height of the last accepted block
height uint64
// blocks stores the last accepted block and all the pending blocks
blocks map[ids.ID]*snowmanBlock // blockID -> snowmanBlock
// preferredIDs stores the set of IDs that are currently preferred.
preferredIDs ids.Set
// tail is the preferred block with no children
tail ids.ID
// Used in [calculateInDegree] and.
// Should only be accessed in that method.
// We use this one instance of ids.Set instead of creating a
// new ids.Set during each call to [calculateInDegree].
leaves ids.Set
// Kahn nodes used in [calculateInDegree] and [markAncestorInDegrees].
// Should only be accessed in those methods.
// We use this one map instead of creating a new map
// during each call to [calculateInDegree].
kahnNodes map[ids.ID]kahnNode
}
// Used to track the kahn topological sort status
type kahnNode struct {
// inDegree is the number of children that haven't been processed yet. If
// inDegree is 0, then this node is a leaf
inDegree int
// votes for all the children of this node, so far
votes ids.Bag
}
// Used to track which children should receive votes
type votes struct {
// parentID is the parent of all the votes provided in the votes bag
parentID ids.ID
// votes for all the children of the parent
votes ids.Bag
}
func (ts *Topological) Initialize(ctx *snow.ConsensusContext, params snowball.Parameters, rootID ids.ID, rootHeight uint64) error {
if err := params.Verify(); err != nil {
return err
}
latencyMetrics, err := metrics.NewLatency("blks", "block(s)", ctx.Log, "", ctx.Registerer)
if err != nil {
return err
}
ts.Latency = latencyMetrics
pollsMetrics, err := metrics.NewPolls("", ctx.Registerer)
if err != nil {
return err
}
ts.Polls = pollsMetrics
heightMetrics, err := metrics.NewHeight("", ctx.Registerer)
if err != nil {
return err
}
ts.Height = heightMetrics
ts.leaves = ids.Set{}
ts.kahnNodes = make(map[ids.ID]kahnNode)
ts.ctx = ctx
ts.params = params
ts.head = rootID
ts.height = rootHeight
ts.blocks = map[ids.ID]*snowmanBlock{
rootID: {sm: ts},
}
ts.tail = rootID
// Initially set the height to the last accepted block.
ts.Height.Accepted(ts.height)
return nil
}
func (ts *Topological) Parameters() snowball.Parameters { return ts.params }
func (ts *Topological) NumProcessing() int { return len(ts.blocks) - 1 }
func (ts *Topological) Add(blk Block) error {
blkID := blk.ID()
// Make sure a block is not inserted twice. This enforces the invariant that
// blocks are always added in topological order. Essentially, a block that
// is being added should never have a child that was already added.
// Additionally, this prevents any edge cases that may occur due to adding
// different blocks with the same ID.
if ts.Decided(blk) || ts.Processing(blkID) {
return errDuplicateAdd
}
ts.Latency.Issued(blkID, ts.pollNumber)
parentID := blk.Parent()
parentNode, ok := ts.blocks[parentID]
if !ok {
// If the ancestor is missing, this means the ancestor must have already
// been pruned. Therefore, the dependent should be transitively
// rejected.
if err := blk.Reject(); err != nil {
return err
}
ts.Latency.Rejected(blkID, ts.pollNumber)
return nil
}
// add the block as a child of its parent, and add the block to the tree
parentNode.AddChild(blk)
ts.blocks[blkID] = &snowmanBlock{
sm: ts,
blk: blk,
}
// If we are extending the tail, this is the new tail
if ts.tail == parentID {
ts.tail = blkID
ts.preferredIDs.Add(blkID)
}
return nil
}
func (ts *Topological) Decided(blk Block) bool {
// If the block is decided, then it must have been previously issued.
if blk.Status().Decided() {
return true
}
// If the block is marked as fetched, we can check if it has been
// transitively rejected.
return blk.Status() == choices.Processing && blk.Height() <= ts.height
}
func (ts *Topological) Processing(blkID ids.ID) bool {
// The last accepted block is in the blocks map, so we first must ensure the
// requested block isn't the last accepted block.
if blkID == ts.head {
return false
}
// If the block is in the map of current blocks and not the head, then the
// block is currently processing.
_, ok := ts.blocks[blkID]
return ok
}
func (ts *Topological) IsPreferred(blk Block) bool {
// If the block is accepted, then it must be transitively preferred.
if blk.Status() == choices.Accepted {
return true
}
return ts.preferredIDs.Contains(blk.ID())
}
func (ts *Topological) Preference() ids.ID { return ts.tail }
// The votes bag contains at most K votes for blocks in the tree. If there is a
// vote for a block that isn't in the tree, the vote is dropped.
//
// Votes are propagated transitively towards the genesis. All blocks in the tree
// that result in at least Alpha votes will record the poll on their children.
// Every other block will have an unsuccessful poll registered.
//
// After collecting which blocks should be voted on, the polls are registered
// and blocks are accepted/rejected as needed. The tail is then updated to equal
// the leaf on the preferred branch.
//
// To optimize the theoretical complexity of the vote propagation, a topological
// sort is done over the blocks that are reachable from the provided votes.
// During the sort, votes are pushed towards the genesis. To prevent interating
// over all blocks that had unsuccessful polls, we set a flag on the block to
// know that any future traversal through that block should register an
// unsuccessful poll on that block and every descendant block.
//
// The complexity of this function is:
// - Runtime = 3 * |live set| + |votes|
// - Space = 2 * |live set| + |votes|
func (ts *Topological) RecordPoll(voteBag ids.Bag) error {
// Register a new poll call
ts.pollNumber++
var voteStack []votes
if voteBag.Len() >= ts.params.Alpha {
// Since we received at least alpha votes, it's possible that
// we reached an alpha majority on a processing block.
// We must perform the traversals to calculate all block
// that reached an alpha majority.
// Populates [ts.kahnNodes] and [ts.leaves]
// Runtime = |live set| + |votes| ; Space = |live set| + |votes|
ts.calculateInDegree(voteBag)
// Runtime = |live set| ; Space = |live set|
voteStack = ts.pushVotes()
}
// Runtime = |live set| ; Space = Constant
preferred, err := ts.vote(voteStack)
if err != nil {
return err
}
// If the set of preferred IDs already contains the preference, then the
// tail is guaranteed to already be set correctly. This is because the value
// returned from vote reports the next preferred block after the last
// preferred block that was voted for. If this block was previously
// preferred, then we know that following the preferences down the chain
// will return the current tail.
if ts.preferredIDs.Contains(preferred) {
return nil
}
// Runtime = |live set| ; Space = Constant
ts.preferredIDs.Clear()
ts.tail = preferred
startBlock := ts.blocks[ts.tail]
// Runtime = |live set| ; Space = Constant
// Traverse from the preferred ID to the last accepted ancestor.
for block := startBlock; !block.Accepted(); {
ts.preferredIDs.Add(block.blk.ID())
block = ts.blocks[block.blk.Parent()]
}
// Traverse from the preferred ID to the preferred child until there are no
// children.
for block := startBlock; block.sb != nil; block = ts.blocks[ts.tail] {
ts.tail = block.sb.Preference()
ts.preferredIDs.Add(ts.tail)
}
return nil
}
func (ts *Topological) Finalized() bool { return len(ts.blocks) == 1 }
// HealthCheck returns information about the consensus health.
func (ts *Topological) HealthCheck() (interface{}, error) {
numOutstandingBlks := ts.Latency.NumProcessing()
isOutstandingBlks := numOutstandingBlks <= ts.params.MaxOutstandingItems
healthy := isOutstandingBlks
details := map[string]interface{}{
"outstandingBlocks": numOutstandingBlks,
}
// check for long running blocks
timeReqRunning := ts.Latency.MeasureAndGetOldestDuration()
isProcessingTime := timeReqRunning <= ts.params.MaxItemProcessingTime
healthy = healthy && isProcessingTime
details["longestRunningBlock"] = timeReqRunning.String()
if !healthy {
var errorReasons []string
if !isOutstandingBlks {
errorReasons = append(errorReasons, fmt.Sprintf("number of outstanding blocks %d > %d", numOutstandingBlks, ts.params.MaxOutstandingItems))
}
if !isProcessingTime {
errorReasons = append(errorReasons, fmt.Sprintf("block processing time %s > %s", timeReqRunning, ts.params.MaxItemProcessingTime))
}
return details, fmt.Errorf("snowman consensus is not healthy reason: %s", strings.Join(errorReasons, ", "))
}
return details, nil
}
// takes in a list of votes and sets up the topological ordering. Returns the
// reachable section of the graph annotated with the number of inbound edges and
// the non-transitively applied votes. Also returns the list of leaf blocks.
func (ts *Topological) calculateInDegree(votes ids.Bag) {
// Clear the Kahn node set
for k := range ts.kahnNodes {
delete(ts.kahnNodes, k)
}
// Clear the leaf set
ts.leaves.Clear()
for _, vote := range votes.List() {
votedBlock, validVote := ts.blocks[vote]
// If the vote is for a block that isn't in the current pending set,
// then the vote is dropped
if !validVote {
continue
}
// If the vote is for the last accepted block, the vote is dropped
if votedBlock.Accepted() {
continue
}
// The parent contains the snowball instance of its children
parentID := votedBlock.blk.Parent()
// Add the votes for this block to the parent's set of responses
numVotes := votes.Count(vote)
kahn, previouslySeen := ts.kahnNodes[parentID]
kahn.votes.AddCount(vote, numVotes)
ts.kahnNodes[parentID] = kahn
// If the parent block already had registered votes, then there is no
// need to iterate into the parents
if previouslySeen {
continue
}
// If I've never seen this parent block before, it is currently a leaf.
ts.leaves.Add(parentID)
// iterate through all the block's ancestors and set up the inDegrees of
// the blocks
for n := ts.blocks[parentID]; !n.Accepted(); n = ts.blocks[parentID] {
parentID = n.blk.Parent()
// Increase the inDegree by one
kahn := ts.kahnNodes[parentID]
kahn.inDegree++
ts.kahnNodes[parentID] = kahn
// If we have already seen this block, then we shouldn't increase
// the inDegree of the ancestors through this block again.
if kahn.inDegree != 1 {
break
}
// If I am transitively seeing this block for the first time, either
// the block was previously unknown or it was previously a leaf.
// Regardless, it shouldn't be tracked as a leaf.
ts.leaves.Remove(parentID)
}
}
}
// convert the tree into a branch of snowball instances with at least alpha
// votes
func (ts *Topological) pushVotes() []votes {
voteStack := make([]votes, 0, len(ts.kahnNodes))
for ts.leaves.Len() > 0 {
// Pop one element of [leaves]
leafID, _ := ts.leaves.Pop()
// Should never return false because we just
// checked that [ts.leaves] is non-empty.
// get the block and sort information about the block
kahnNode := ts.kahnNodes[leafID]
block := ts.blocks[leafID]
// If there are at least Alpha votes, then this block needs to record
// the poll on the snowball instance
if kahnNode.votes.Len() >= ts.params.Alpha {
voteStack = append(voteStack, votes{
parentID: leafID,
votes: kahnNode.votes,
})
}
// If the block is accepted, then we don't need to push votes to the
// parent block
if block.Accepted() {
continue
}
parentID := block.blk.Parent()
// Remove an inbound edge from the parent kahn node and push the votes.
parentKahnNode := ts.kahnNodes[parentID]
parentKahnNode.inDegree--
parentKahnNode.votes.AddCount(leafID, kahnNode.votes.Len())
ts.kahnNodes[parentID] = parentKahnNode
// If the inDegree is zero, then the parent node is now a leaf
if parentKahnNode.inDegree == 0 {
ts.leaves.Add(parentID)
}
}
return voteStack
}
// apply votes to the branch that received an Alpha threshold and returns the
// next preferred block after the last preferred block that received an Alpha
// threshold.
func (ts *Topological) vote(voteStack []votes) (ids.ID, error) {
// If the voteStack is empty, then the full tree should falter. This won't
// change the preferred branch.
if len(voteStack) == 0 {
headBlock := ts.blocks[ts.head]
headBlock.shouldFalter = true
if numProcessing := len(ts.blocks) - 1; numProcessing > 0 {
ts.ctx.Log.Verbo("no progress was made after processing pending blocks",
zap.Int("numProcessing", numProcessing),
)
ts.Polls.Failed()
}
return ts.tail, nil
}
// keep track of the new preferred block
newPreferred := ts.head
onPreferredBranch := true
for len(voteStack) > 0 {
// pop a vote off the stack
newStackSize := len(voteStack) - 1
vote := voteStack[newStackSize]
voteStack = voteStack[:newStackSize]
// get the block that we are going to vote on
parentBlock, notRejected := ts.blocks[vote.parentID]
// if the block block we are going to vote on was already rejected, then
// we should stop applying the votes
if !notRejected {
break
}
// keep track of transitive falters to propagate to this block's
// children
shouldTransitivelyFalter := parentBlock.shouldFalter
// if the block was previously marked as needing to falter, the block
// should falter before applying the vote
if shouldTransitivelyFalter {
ts.ctx.Log.Verbo("resetting confidence below parent",
zap.Stringer("parentID", vote.parentID),
)
parentBlock.sb.RecordUnsuccessfulPoll()
parentBlock.shouldFalter = false
}
// apply the votes for this snowball instance
parentBlock.sb.RecordPoll(vote.votes)
// Only accept when you are finalized and the head.
if parentBlock.sb.Finalized() && ts.head == vote.parentID {
if err := ts.acceptPreferredChild(parentBlock); err != nil {
return ids.ID{}, err
}
// by accepting the child of parentBlock, the last accepted block is
// no longer voteParentID, but its child. So, voteParentID can be
// removed from the tree.
delete(ts.blocks, vote.parentID)
}
// If we are on the preferred branch, then the parent's preference is
// the next block on the preferred branch.
parentPreference := parentBlock.sb.Preference()
if onPreferredBranch {
newPreferred = parentPreference
}
// Get the ID of the child that is having a RecordPoll called. All other
// children will need to have their confidence reset. If there isn't a
// child having RecordPoll called, then the nextID will default to the
// nil ID.
nextID := ids.ID{}
if len(voteStack) > 0 {
nextID = voteStack[newStackSize-1].parentID
}
// If we are on the preferred branch and the nextID is the preference of
// the snowball instance, then we are following the preferred branch.
onPreferredBranch = onPreferredBranch && nextID == parentPreference
// If there wasn't an alpha threshold on the branch (either on this vote
// or a past transitive vote), I should falter now.
for childID := range parentBlock.children {
// If we don't need to transitively falter and the child is going to
// have RecordPoll called on it, then there is no reason to reset
// the block's confidence
if !shouldTransitivelyFalter && childID == nextID {
continue
}
// If we finalized a child of the current block, then all other
// children will have been rejected and removed from the tree.
// Therefore, we need to make sure the child is still in the tree.
childBlock, notRejected := ts.blocks[childID]
if notRejected {
ts.ctx.Log.Verbo("defering confidence reset of child block",
zap.Stringer("childID", childID),
)
ts.ctx.Log.Verbo("voting for next block",
zap.Stringer("nextID", nextID),
)
// If the child is ever voted for positively, the confidence
// must be reset first.
childBlock.shouldFalter = true
}
}
}
ts.Polls.Successful()
return newPreferred, nil
}
// Accepts the preferred child of the provided snowman block. By accepting the
// preferred child, all other children will be rejected. When these children are
// rejected, all their descendants will be rejected.
//
// We accept a block once its parent's snowball instance has finalized
// with it as the preference.
func (ts *Topological) acceptPreferredChild(n *snowmanBlock) error {
// We are finalizing the block's child, so we need to get the preference
pref := n.sb.Preference()
// Get the child and accept it
child := n.children[pref]
// Notify anyone listening that this block was accepted.
bytes := child.Bytes()
// Note that DecisionAcceptor.Accept / ConsensusAcceptor.Accept must be
// called before child.Accept to honor Acceptor.Accept's invariant.
if err := ts.ctx.DecisionAcceptor.Accept(ts.ctx, pref, bytes); err != nil {
return err
}
if err := ts.ctx.ConsensusAcceptor.Accept(ts.ctx, pref, bytes); err != nil {
return err
}
ts.ctx.Log.Trace("accepting block",
zap.Stringer("blkID", pref),
)
if err := child.Accept(); err != nil {
return err
}
// Because this is the newest accepted block, this is the new head.
ts.head = pref
ts.height = child.Height()
// Remove the decided block from the set of processing IDs, as its status
// now implies its preferredness.
ts.preferredIDs.Remove(pref)
ts.Latency.Accepted(pref, ts.pollNumber)
ts.Height.Accepted(ts.height)
// Because ts.blocks contains the last accepted block, we don't delete the
// block from the blocks map here.
rejects := make([]ids.ID, 0, len(n.children)-1)
for childID, child := range n.children {
if childID == pref {
// don't reject the block we just accepted
continue
}
ts.ctx.Log.Trace("rejecting block",
zap.String("reason", "conflict with accepted block"),
zap.Stringer("rejectedID", childID),
zap.Stringer("conflictedID", pref),
)
if err := child.Reject(); err != nil {
return err
}
ts.Latency.Rejected(childID, ts.pollNumber)
// Track which blocks have been directly rejected
rejects = append(rejects, childID)
}
// reject all the descendants of the blocks we just rejected
return ts.rejectTransitively(rejects)
}
// Takes in a list of rejected ids and rejects all descendants of these IDs
func (ts *Topological) rejectTransitively(rejected []ids.ID) error {
// the rejected array is treated as a stack, with the next element at index
// 0 and the last element at the end of the slice.
for len(rejected) > 0 {
// pop the rejected ID off the stack
newRejectedSize := len(rejected) - 1
rejectedID := rejected[newRejectedSize]
rejected = rejected[:newRejectedSize]
// get the rejected node, and remove it from the tree
rejectedNode := ts.blocks[rejectedID]
delete(ts.blocks, rejectedID)
for childID, child := range rejectedNode.children {
if err := child.Reject(); err != nil {
return err
}
ts.Latency.Rejected(childID, ts.pollNumber)
// add the newly rejected block to the end of the stack
rejected = append(rejected, childID)
}
}
return nil
}