diff --git a/docs/generated/http/full.md b/docs/generated/http/full.md index b1d2f7551d91..08e940161f3d 100644 --- a/docs/generated/http/full.md +++ b/docs/generated/http/full.md @@ -1309,6 +1309,7 @@ RangeProblems describes issues reported by a range. For internal use only. | quiescent_equals_ticking | [bool](#cockroach.server.serverpb.RaftDebugResponse-bool) | | Quiescent ranges do not tick by definition, but we track this in two different ways and suspect that they're getting out of sync. If the replica's quiescent flag doesn't agree with the store's list of replicas that are ticking, warn about it. | [reserved](#support-status) | | raft_log_too_large | [bool](#cockroach.server.serverpb.RaftDebugResponse-bool) | | When the raft log is too large, it can be a symptom of other issues. | [reserved](#support-status) | | circuit_breaker_error | [bool](#cockroach.server.serverpb.RaftDebugResponse-bool) | | | [reserved](#support-status) | +| paused_followers | [bool](#cockroach.server.serverpb.RaftDebugResponse-bool) | | | [reserved](#support-status) | @@ -1554,6 +1555,7 @@ RangeProblems describes issues reported by a range. For internal use only. | quiescent_equals_ticking | [bool](#cockroach.server.serverpb.RangesResponse-bool) | | Quiescent ranges do not tick by definition, but we track this in two different ways and suspect that they're getting out of sync. If the replica's quiescent flag doesn't agree with the store's list of replicas that are ticking, warn about it. | [reserved](#support-status) | | raft_log_too_large | [bool](#cockroach.server.serverpb.RangesResponse-bool) | | When the raft log is too large, it can be a symptom of other issues. | [reserved](#support-status) | | circuit_breaker_error | [bool](#cockroach.server.serverpb.RangesResponse-bool) | | | [reserved](#support-status) | +| paused_followers | [bool](#cockroach.server.serverpb.RangesResponse-bool) | | | [reserved](#support-status) | @@ -3366,6 +3368,7 @@ Support status: [reserved](#support-status) | quiescent_equals_ticking_range_ids | [int64](#cockroach.server.serverpb.ProblemRangesResponse-int64) | repeated | | [reserved](#support-status) | | raft_log_too_large_range_ids | [int64](#cockroach.server.serverpb.ProblemRangesResponse-int64) | repeated | | [reserved](#support-status) | | circuit_breaker_error_range_ids | [int64](#cockroach.server.serverpb.ProblemRangesResponse-int64) | repeated | | [reserved](#support-status) | +| paused_replica_ids | [int64](#cockroach.server.serverpb.ProblemRangesResponse-int64) | repeated | | [reserved](#support-status) | @@ -3758,6 +3761,7 @@ RangeProblems describes issues reported by a range. For internal use only. | quiescent_equals_ticking | [bool](#cockroach.server.serverpb.RangeResponse-bool) | | Quiescent ranges do not tick by definition, but we track this in two different ways and suspect that they're getting out of sync. If the replica's quiescent flag doesn't agree with the store's list of replicas that are ticking, warn about it. | [reserved](#support-status) | | raft_log_too_large | [bool](#cockroach.server.serverpb.RangeResponse-bool) | | When the raft log is too large, it can be a symptom of other issues. | [reserved](#support-status) | | circuit_breaker_error | [bool](#cockroach.server.serverpb.RangeResponse-bool) | | | [reserved](#support-status) | +| paused_followers | [bool](#cockroach.server.serverpb.RangeResponse-bool) | | | [reserved](#support-status) | diff --git a/docs/generated/swagger/spec.json b/docs/generated/swagger/spec.json index 7ec2c125eab6..41c97cfdb881 100644 --- a/docs/generated/swagger/spec.json +++ b/docs/generated/swagger/spec.json @@ -1257,6 +1257,10 @@ "type": "boolean", "x-go-name": "Overreplicated" }, + "paused_followers": { + "type": "boolean", + "x-go-name": "PausedFollowers" + }, "quiescent_equals_ticking": { "description": "Quiescent ranges do not tick by definition, but we track this in\ntwo different ways and suspect that they're getting out of sync.\nIf the replica's quiescent flag doesn't agree with the store's\nlist of replicas that are ticking, warn about it.", "type": "boolean", diff --git a/pkg/server/problem_ranges.go b/pkg/server/problem_ranges.go index 8c0c24c84d85..c47ecf0c69b5 100644 --- a/pkg/server/problem_ranges.go +++ b/pkg/server/problem_ranges.go @@ -133,6 +133,10 @@ func (s *statusServer) ProblemRanges( problems.CircuitBreakerErrorRangeIDs = append(problems.CircuitBreakerErrorRangeIDs, info.State.Desc.RangeID) } + if info.Problems.PausedFollowers { + problems.PausedReplicaIDs = + append(problems.PausedReplicaIDs, info.State.Desc.RangeID) + } } sort.Sort(roachpb.RangeIDSlice(problems.UnavailableRangeIDs)) sort.Sort(roachpb.RangeIDSlice(problems.RaftLeaderNotLeaseHolderRangeIDs)) @@ -143,6 +147,7 @@ func (s *statusServer) ProblemRanges( sort.Sort(roachpb.RangeIDSlice(problems.QuiescentEqualsTickingRangeIDs)) sort.Sort(roachpb.RangeIDSlice(problems.RaftLogTooLargeRangeIDs)) sort.Sort(roachpb.RangeIDSlice(problems.CircuitBreakerErrorRangeIDs)) + sort.Sort(roachpb.RangeIDSlice(problems.PausedReplicaIDs)) response.ProblemsByNodeID[resp.nodeID] = problems case <-ctx.Done(): return nil, status.Errorf(codes.DeadlineExceeded, ctx.Err().Error()) diff --git a/pkg/server/serverpb/status.proto b/pkg/server/serverpb/status.proto index 93452f3b93d1..54504e884ef1 100644 --- a/pkg/server/serverpb/status.proto +++ b/pkg/server/serverpb/status.proto @@ -389,6 +389,7 @@ message RangeProblems { // When the raft log is too large, it can be a symptom of other issues. bool raft_log_too_large = 7; bool circuit_breaker_error = 9; + bool paused_followers = 10; } // RangeStatistics describes statistics reported by a range. For internal use @@ -1223,6 +1224,11 @@ message ProblemRangesResponse { (gogoproto.casttype) = "github.com/cockroachdb/cockroach/pkg/roachpb.RangeID" ]; + repeated int64 paused_replica_ids = 11 [ + (gogoproto.customname) = "PausedReplicaIDs", + (gogoproto.casttype) = + "github.com/cockroachdb/cockroach/pkg/roachpb.RangeID" + ]; } reserved 1 to 7; // NodeID is the node that submitted all the requests. diff --git a/pkg/server/status.go b/pkg/server/status.go index 73ac3259965d..c2d5b2c581c3 100644 --- a/pkg/server/status.go +++ b/pkg/server/status.go @@ -2045,6 +2045,7 @@ func (s *statusServer) rangesHelper( QuiescentEqualsTicking: raftStatus != nil && metrics.Quiescent == metrics.Ticking, RaftLogTooLarge: metrics.RaftLogTooLarge, CircuitBreakerError: len(state.CircuitBreakerError) > 0, + PausedFollowers: metrics.PausedFollowerCount > 0, }, LeaseStatus: metrics.LeaseStatus, Quiescent: metrics.Quiescent, diff --git a/pkg/ui/workspaces/db-console/src/views/cluster/containers/nodeGraphs/dashboards/graphTooltips.tsx b/pkg/ui/workspaces/db-console/src/views/cluster/containers/nodeGraphs/dashboards/graphTooltips.tsx index 16c436df3799..f562127c9de6 100644 --- a/pkg/ui/workspaces/db-console/src/views/cluster/containers/nodeGraphs/dashboards/graphTooltips.tsx +++ b/pkg/ui/workspaces/db-console/src/views/cluster/containers/nodeGraphs/dashboards/graphTooltips.tsx @@ -165,3 +165,7 @@ export const CircuitBreakerTrippedEventsTooltip: React.FC = () => ( since the process started. ); + +export const PausedFollowersTooltip: React.FC = () => ( +