Skip to content

Commit

Permalink
add method (*EtcdServer) IsRaftLoopBlocked to support checking whethe…
Browse files Browse the repository at this point in the history
…r the raft loop is blocked

Signed-off-by: Benjamin Wang <[email protected]>
  • Loading branch information
ahrtr committed Oct 8, 2023
1 parent 01a0d8b commit a398af0
Show file tree
Hide file tree
Showing 3 changed files with 97 additions and 0 deletions.
17 changes: 17 additions & 0 deletions server/etcdserver/raft.go
Original file line number Diff line number Diff line change
Expand Up @@ -99,6 +99,9 @@ type raftNode struct {

stopped chan struct{}
done chan struct{}

// dummyc is used by the liveness probe to check whether the raft loop is blocked.
dummyc chan struct{}
}

type raftNodeConfig struct {
Expand Down Expand Up @@ -142,6 +145,7 @@ func newRaftNode(cfg raftNodeConfig) *raftNode {
applyc: make(chan toApply),
stopped: make(chan struct{}),
done: make(chan struct{}),
dummyc: make(chan struct{}),
}
if r.heartbeat == 0 {
r.ticker = &time.Ticker{}
Expand Down Expand Up @@ -322,6 +326,8 @@ func (r *raftNode) start(rh *raftReadyHandler) {
// notify etcdserver that raft has already been notified or advanced.
raftAdvancedC <- struct{}{}
}
case <-r.dummyc:
r.lg.Debug("Received dummy event")
case <-r.stopped:
return
}
Expand Down Expand Up @@ -413,6 +419,17 @@ func (r *raftNode) onStop() {
close(r.done)
}

// trySendDummyEvent tries to hand an empty event to the raft loop through
// r.dummyc, waiting at most timeout for the send to be accepted.
//
// It returns nil when the event was accepted, and also when r.done is closed
// (a stopped node is not reported as blocked). It returns a non-nil error
// only when neither happened before timeout elapsed.
func (r *raftNode) trySendDummyEvent(timeout time.Duration) error {
	// An explicit timer (rather than time.After) lets us release it as soon
	// as one of the other cases wins, instead of keeping it alive until it
	// fires; this matters because the probe may be called repeatedly with a
	// timeout of several seconds.
	timer := time.NewTimer(timeout)
	defer timer.Stop()

	select {
	case r.dummyc <- struct{}{}:
		// The raft loop picked up the event, so it is not blocked.
		return nil
	case <-r.done:
		// The node has been stopped; nothing left to probe.
		return nil
	case <-timer.C:
		return fmt.Errorf("failed to send dummy event in %s", timeout.String())
	}
}

// for testing
func (r *raftNode) pauseSending() {
p := r.transport.(rafthttp.Pausable)
Expand Down
69 changes: 69 additions & 0 deletions server/etcdserver/raft_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@ import (
"testing"
"time"

"github.com/stretchr/testify/assert"
"go.uber.org/zap/zaptest"

"go.etcd.io/etcd/client/pkg/v3/types"
Expand Down Expand Up @@ -322,3 +323,71 @@ func TestStopRaftNodeMoreThanOnce(t *testing.T) {
}
}
}

// TestTrySendDummyEvent verifies that trySendDummyEvent reports an error only
// when the raft loop cannot accept the dummy event in time, and reports no
// error once the node's done channel is closed.
func TestTrySendDummyEvent(t *testing.T) {
	testCases := []struct {
		name string
		// drainApply controls whether the test receives from applyc before probing.
		drainApply bool
		// stopped controls whether the done channel is closed before probing.
		stopped bool
		// expectBlocked is true when trySendDummyEvent must return an error.
		expectBlocked bool
	}{
		{
			name:          "normal case",
			drainApply:    true,
			stopped:       false,
			expectBlocked: false,
		},
		{
			name:          "blocked on apply",
			drainApply:    false,
			stopped:       false,
			expectBlocked: true,
		},
		{
			name:          "not blocked due to stopped",
			drainApply:    false,
			stopped:       true,
			expectBlocked: false,
		},
	}

	for _, tc := range testCases {
		tc := tc
		t.Run(tc.name, func(t *testing.T) {
			n := newNopReadyNode()

			r := newRaftNode(raftNodeConfig{
				lg:          zaptest.NewLogger(t),
				Node:        n,
				storage:     mockstorage.NewStorageRecorder(""),
				raftStorage: raft.NewMemoryStorage(),
				transport:   newNopTransporter(),
			})
			// srv.r is a copy of *r; the copy shares r's channels, so all
			// further interaction goes through srv.r for consistency.
			srv := &EtcdServer{lgMu: new(sync.RWMutex), lg: zaptest.NewLogger(t), r: *r}

			srv.r.start(&raftReadyHandler{
				getLead:          func() uint64 { return 0 },
				updateLead:       func(uint64) {},
				updateLeadership: func(bool) {},
			})
			defer srv.r.Stop()

			n.readyc <- raft.Ready{
				SoftState: &raft.SoftState{RaftState: raft.StateFollower},
				Entries:   []raftpb.Entry{{Type: raftpb.EntryConfChange}},
			}
			// Presumably gives the raft loop time to consume the Ready and
			// reach its send on applyc — TODO confirm against start().
			time.Sleep(time.Second)

			if tc.drainApply {
				<-srv.r.applyc
			}

			if tc.stopped {
				// NOTE(review): onStop also closes done; if the deferred Stop
				// makes the raft loop run onStop after this manual close, the
				// channel would be closed twice — confirm this cannot happen.
				close(srv.r.done)
			}

			err := srv.r.trySendDummyEvent(2 * time.Second)
			assert.Equal(t, tc.expectBlocked, err != nil, err)
		})
	}
}
11 changes: 11 additions & 0 deletions server/etcdserver/server.go
Original file line number Diff line number Diff line change
Expand Up @@ -1262,6 +1262,17 @@ func (s *EtcdServer) Stop() {
s.HardStop()
}

// IsRaftLoopBlocked probes the raft loop by trying to send it a dummy event
// and waiting up to `timeout` for the loop to accept it.
//
// A zero `timeout` selects the default of 2*ElectionTimeout, described by
// the original author as the maximum time to trigger a new leader election.
//
// A non-nil error means the loop is considered blocked; nil means it is not.
func (s *EtcdServer) IsRaftLoopBlocked(timeout time.Duration) error {
	wait := timeout
	if wait == 0 {
		// Caller did not specify a timeout; fall back to the default.
		wait = 2 * s.Cfg.ElectionTimeout()
	}

	return s.r.trySendDummyEvent(wait)
}

// ReadyNotify exposes the server's readiness channel. Per the original
// documentation, the channel is closed once the server is ready to serve
// client requests, so callers can block on it to wait for readiness.
func (s *EtcdServer) ReadyNotify() <-chan struct{} {
	return s.readych
}
Expand Down

0 comments on commit a398af0

Please sign in to comment.