fix(grpc/client): clear reconnecting on failure and requeue reconnection after backoff

Ensure the reconnecting flag is reset after a failed attempt so that subsequent retries can proceed, and explicitly trigger another reconnection attempt once the backoff period has elapsed so that the client keeps retrying until the connection recovers.
2026-01-21 17:21:09 +01:00 · 2025-10-21 22:03:17 +08:00
parent 138bed5c05
commit 18fc84afb7
1 changed file with 11 additions and 1 deletion
--- a/core/grpc/client/client.go
+++ b/core/grpc/client/client.go
@@ -817,7 +817,7 @@ func (c *GrpcClient) executeReconnection() {
 		c.Errorf("reconnection failed: %v", err)
 		c.recordFailure()

-		// Clear reconnecting flag on failure
+		// Clear reconnecting flag on failure so we can retry
 		c.reconnectMux.Lock()
 		c.reconnecting = false
 		c.reconnectMux.Unlock()
@@ -826,6 +826,16 @@ func (c *GrpcClient) executeReconnection() {
 		backoffDuration := c.calculateBackoff()
 		c.Warnf("will retry reconnection after %v backoff", backoffDuration)
 		time.Sleep(backoffDuration)
+
+		// Trigger another reconnection attempt after backoff
+		// This ensures we keep trying even if network was down during first attempt
+		c.Debugf("backoff complete, triggering reconnection retry")
+		select {
+		case c.reconnect <- struct{}{}:
+			c.Debugf("reconnection retry triggered")
+		default:
+			c.Debugf("reconnection retry already pending")
+		}
 	} else {
 		c.recordSuccess()
 		c.Infof("reconnection successful - connection state: %s, registered: %v", c.getState(), c.IsRegistered())