Skip to content

Commit

Permalink
Merge pull request #119373 from fqazi/backport22.2-119305
Browse files Browse the repository at this point in the history
release-22.2: sql: crdb_internal.leases could cause a deadlock with the lease manager
  • Loading branch information
fqazi authored Feb 21, 2024
2 parents d54cf31 + c1dc400 commit 44a4515
Show file tree
Hide file tree
Showing 2 changed files with 51 additions and 13 deletions.
49 changes: 36 additions & 13 deletions pkg/sql/crdb_internal.go
Original file line number Diff line number Diff line change
Expand Up @@ -811,9 +811,14 @@ CREATE TABLE crdb_internal.schema_changes (
},
}

type crdbInternalLeasesTableEntry struct {
desc catalog.Descriptor
takenOffline bool
expiration tree.DTimestamp
}

// TODO(tbg): prefix with node_.
var crdbInternalLeasesTable = virtualSchemaTable{
comment: `acquired table leases (RAM; local node only)`,
schema: `
CREATE TABLE crdb_internal.leases (
node_id INT NOT NULL,
Expand All @@ -823,27 +828,45 @@ CREATE TABLE crdb_internal.leases (
expiration TIMESTAMP NOT NULL,
deleted BOOL NOT NULL
)`,
comment: `acquired table leases (RAM; local node only)`,
populate: func(
ctx context.Context, p *planner, _ catalog.DatabaseDescriptor, addRow func(...tree.Datum) error,
) (err error) {
nodeID, _ := p.execCfg.NodeInfo.NodeID.OptionalNodeID() // zero if not available
var leaseEntries []crdbInternalLeasesTableEntry
p.LeaseMgr().VisitLeases(func(desc catalog.Descriptor, takenOffline bool, _ int, expiration tree.DTimestamp) (wantMore bool) {
if p.CheckAnyPrivilege(ctx, desc) != nil {
// Because we have locked the lease manager while visiting every lease,
// it not safe to *acquire* or *release* any leases in the process. As
// a result, build an in memory cache of entries and process them after
// all the locks have been released. Previously we would check privileges,
// which would need to get the lease on the role_member table. Simply skipping
// this check on that table will not be sufficient since any active lease
// on it could expire or need an renewal and cause the sample problem.
leaseEntries = append(leaseEntries, crdbInternalLeasesTableEntry{
desc: desc,
takenOffline: takenOffline,
expiration: expiration,
})
return true
})
for _, entry := range leaseEntries {
if p.CheckAnyPrivilege(ctx, entry.desc) != nil {
// TODO(ajwerner): inspect what type of error got returned.
return true
continue
}

err = addRow(
if err := addRow(
tree.NewDInt(tree.DInt(nodeID)),
tree.NewDInt(tree.DInt(int64(desc.GetID()))),
tree.NewDString(desc.GetName()),
tree.NewDInt(tree.DInt(int64(desc.GetParentID()))),
&expiration,
tree.MakeDBool(tree.DBool(takenOffline)),
)
return err == nil
})
return err
tree.NewDInt(tree.DInt(int64(entry.desc.GetID()))),
tree.NewDString(entry.desc.GetName()),
tree.NewDInt(tree.DInt(int64(entry.desc.GetParentID()))),
&entry.expiration,
tree.MakeDBool(tree.DBool(entry.takenOffline)),
); err != nil {
return err
}
}
return nil
},
}

Expand Down
15 changes: 15 additions & 0 deletions pkg/sql/logictest/testdata/logic_test/crdb_internal
Original file line number Diff line number Diff line change
Expand Up @@ -1374,3 +1374,18 @@ CREATE TABLE t76710_1 AS SELECT * FROM crdb_internal.statement_statistics;

statement ok
CREATE MATERIALIZED VIEW t76710_2 AS SELECT fingerprint_id FROM crdb_internal.cluster_statement_statistics;

# In #119253 we observed a deadlock when visiting leases inside crdb_internal.lease
# between the lease manager and the authorization check for each descriptor. This
# test validates that this is no longer the case.
subtest allow_role_memberships_to_change_during_transaction

user testuser

statement ok
set allow_role_memberships_to_change_during_transaction=true

statement ok
SELECT * FROM crdb_internal.leases;

subtest end

0 comments on commit 44a4515

Please sign in to comment.