Skip to content

Commit

Permalink
etcdserver: add more detailed traces on linearized reading
Browse files Browse the repository at this point in the history
To improve debuggability of `agreement among raft nodes before
linearized reading`, we added some tracing inside
`linearizableReadLoop`.

This will allow us to know the timing of `s.r.ReadIndex` vs
`s.applyWait.Wait(rs.Index)`.

Signed-off-by: Chao Chen <chaochn@amazon.com>
  • Loading branch information
PierreZ authored and chaochn47 committed Jul 19, 2022
1 parent d58a0c0 commit f298598
Show file tree
Hide file tree
Showing 2 changed files with 23 additions and 2 deletions.
18 changes: 16 additions & 2 deletions etcdserver/v3_server.go
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ import (
"bytes"
"context"
"encoding/binary"
"strconv"
"time"

"go.etcd.io/etcd/auth"
Expand Down Expand Up @@ -710,6 +711,9 @@ func (s *EtcdServer) linearizableReadLoop() {
return
}

// as a single loop can unlock multiple reads, it is not very useful
// to propagate the trace from Txn or Range.
trace := traceutil.New("linearizableReadLoop", s.getLogger())
nextnr := newNotifier()

s.readMu.Lock()
Expand Down Expand Up @@ -782,16 +786,26 @@ func (s *EtcdServer) linearizableReadLoop() {
if !done {
continue
}
trace.Step("read index received")

if ai := s.getAppliedIndex(); ai < rs.Index {
index := rs.Index
trace.AddField(traceutil.Field{Key: "readStateIndex", Value: index})

ai := s.getAppliedIndex()
trace.AddField(traceutil.Field{Key: "appliedIndex", Value: strconv.FormatUint(ai, 10)})

if ai < index {
select {
case <-s.applyWait.Wait(rs.Index):
case <-s.applyWait.Wait(index):
case <-s.stopping:
return
}
}
// unblock all l-reads requested at indices before rs.Index
nr.notify(nil)
trace.Step("applied index is now lower than readState.Index")

trace.LogAllStepsIfLong(traceThreshold)
}
}

Expand Down
7 changes: 7 additions & 0 deletions pkg/traceutil/trace.go
Original file line number Diff line number Diff line change
Expand Up @@ -138,6 +138,13 @@ func (t *Trace) LogIfLong(threshold time.Duration) {
}
}

// LogAllStepsIfLong emits the trace only when the time elapsed since the
// trace's start time exceeds threshold. When it does, the trace is logged via
// LogWithStepThreshold with a step threshold of 0, so steps are not filtered
// out by a minimum per-step duration.
func (t *Trace) LogAllStepsIfLong(threshold time.Duration) {
	elapsed := time.Since(t.startTime)
	if elapsed <= threshold {
		// The trace finished within the allowed time; stay silent.
		return
	}
	t.LogWithStepThreshold(0)
}

// LogWithStepThreshold only dumps steps whose duration is longer than the step threshold.
func (t *Trace) LogWithStepThreshold(threshold time.Duration) {
msg, fs := t.logInfo(threshold)
Expand Down

0 comments on commit f298598

Please sign in to comment.