Skip to content

Commit

Permalink
kvserver: read lease under mutex when switching lease type
Browse files Browse the repository at this point in the history
A race could occur when a replica queue and post lease application both
attempted to switch the lease type. This race would cause the queue to
not process the replica because the lease type had already changed. As a
result, lease preference violations might not have been quickly
resolved by the lease queue.

Read the lease under the same mutex used for requesting the lease, when
possibly switching the lease type.

Resolves: cockroachdb#123998
Release note: None
  • Loading branch information
kvoli committed May 16, 2024
1 parent 28bce06 commit 574f667
Show file tree
Hide file tree
Showing 2 changed files with 19 additions and 12 deletions.
4 changes: 2 additions & 2 deletions pkg/kv/kvserver/queue.go
Original file line number Diff line number Diff line change
Expand Up @@ -1058,7 +1058,7 @@ func (bq *baseQueue) replicaCanBeProcessed(
// and renew or acquire if necessary.
if bq.needsLease {
if acquireLeaseIfNeeded {
leaseStatus, pErr := repl.redirectOnOrAcquireLease(ctx)
_, pErr := repl.redirectOnOrAcquireLease(ctx)
if pErr != nil {
switch v := pErr.GetDetail().(type) {
case *kvpb.NotLeaseHolderError, *kvpb.RangeNotFoundError:
Expand All @@ -1071,7 +1071,7 @@ func (bq *baseQueue) replicaCanBeProcessed(

// TODO(baptist): Should this be added to replicaInQueue?
realRepl, _ := repl.(*Replica)
pErr = realRepl.maybeSwitchLeaseType(ctx, leaseStatus)
pErr = realRepl.maybeSwitchLeaseType(ctx)
if pErr != nil {
return nil, pErr.GoError()
}
Expand Down
27 changes: 17 additions & 10 deletions pkg/kv/kvserver/replica_range_lease.go
Original file line number Diff line number Diff line change
Expand Up @@ -1610,17 +1610,24 @@ func (r *Replica) shouldRequestLeaseRLocked(
// maybeSwitchLeaseType will synchronously renew a lease using the appropriate
// type if it is (or was) owned by this replica and has an incorrect type. This
// typically happens when changing kv.expiration_leases_only.enabled.
func (r *Replica) maybeSwitchLeaseType(ctx context.Context, st kvserverpb.LeaseStatus) *kvpb.Error {
if !st.OwnedBy(r.store.StoreID()) {
return nil
}
func (r *Replica) maybeSwitchLeaseType(ctx context.Context) *kvpb.Error {
llHandle := func() *leaseRequestHandle {
now := r.store.Clock().NowAsClockTimestamp()
// The lease status needs to be checked and requested under the same lock,
// to avoid an interleaving lease request changing the lease between the
// two.
r.mu.Lock()
defer r.mu.Unlock()

var llHandle *leaseRequestHandle
r.mu.Lock()
if !r.hasCorrectLeaseTypeRLocked(st.Lease) {
llHandle = r.requestLeaseLocked(ctx, st, nil /* limiter */)
}
r.mu.Unlock()
st := r.leaseStatusAtRLocked(ctx, now)
if !st.OwnedBy(r.store.StoreID()) {
return nil
}
if r.hasCorrectLeaseTypeRLocked(st.Lease) {
return nil
}
return r.requestLeaseLocked(ctx, st, nil /* limiter */)
}()

if llHandle != nil {
select {
Expand Down

0 comments on commit 574f667

Please sign in to comment.