-
Notifications
You must be signed in to change notification settings - Fork 3.8k
/
Copy pathconstants.go
473 lines (440 loc) · 21.3 KB
/
constants.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
// Copyright 2015 The Cockroach Authors.
//
// Use of this software is governed by the Business Source License
// included in the file licenses/BSL.txt.
//
// As of the Change Date specified in that file, in accordance with
// the Business Source License, use of this software will be governed
// by the Apache License, Version 2.0, included in the file
// licenses/APL.txt.
package keys
import (
"math"
"github.com/cockroachdb/cockroach/pkg/roachpb"
)
// For a high-level overview of the keyspace layout, see the package comment in
// doc.go.
// These constants are single bytes for performance. They allow single-byte
// comparisons which are considerably faster than bytes.HasPrefix.
const (
meta1PrefixByte = roachpb.LocalMaxByte
meta2PrefixByte = '\x03'
metaMaxByte = '\x04'
systemPrefixByte = metaMaxByte
systemMaxByte = '\x05'
tenantPrefixByte = '\xfe'
)
// Constants for system-reserved keys in the KV map.
//
// Note: Preserve group-wise ordering when adding new constants.
// Note: Update `keymap` in doc.go when adding new constants.
var (
// MinKey is a minimum key value which sorts before all other keys.
MinKey = roachpb.KeyMin
// MaxKey is the infinity marker which is larger than any other key.
MaxKey = roachpb.KeyMax
// LocalPrefix is the prefix for all local keys.
LocalPrefix = roachpb.LocalPrefix
// LocalMax is the end of the local key range. It is itself a global key.
LocalMax = roachpb.LocalMax
// localSuffixLength specifies the length in bytes of all local
// key suffixes.
localSuffixLength = 4
// There are five types of local key data enumerated below: replicated
// range-ID, unreplicated range-ID, range local, store-local, and range lock
// keys.
// 1. Replicated Range-ID keys
//
// LocalRangeIDPrefix is the prefix identifying per-range data
// indexed by Range ID. The Range ID is appended to this prefix,
// encoded using EncodeUvarint. The specific sort of per-range
// metadata is identified by one of the suffixes listed below, along
// with potentially additional encoded key info, for instance in the
// case of AbortSpan entry.
LocalRangeIDPrefix = roachpb.RKey(makeKey(LocalPrefix, roachpb.Key("i")))
// LocalRangeIDReplicatedInfix is the post-Range ID specifier for all Raft
// replicated per-range data. By appending this after the Range ID, these
// keys will be sorted directly before the local unreplicated keys for the
// same Range ID, so they can be manipulated either together or individually
// in a single scan.
LocalRangeIDReplicatedInfix = []byte("r")
// LocalAbortSpanSuffix is the suffix for AbortSpan entries. The
// AbortSpan protects a transaction from re-reading its own intents
// after it's been aborted.
LocalAbortSpanSuffix = []byte("abc-")
// localRangeFrozenStatusSuffix is DEPRECATED and remains to prevent reuse.
localRangeFrozenStatusSuffix = []byte("fzn-")
// LocalRangeGCThresholdSuffix is the suffix for the GC threshold. It keeps
// the lgc- ("last GC") representation for backwards compatibility.
LocalRangeGCThresholdSuffix = []byte("lgc-")
// LocalRangeAppliedStateSuffix is the suffix for the range applied state
// key.
LocalRangeAppliedStateSuffix = []byte("rask")
// LocalRaftTruncatedStateSuffix is the suffix for the
// RaftTruncatedState.
// Note: This suffix is also used for unreplicated Range-ID keys.
LocalRaftTruncatedStateSuffix = []byte("rftt")
// LocalRangeLeaseSuffix is the suffix for a range lease.
LocalRangeLeaseSuffix = []byte("rll-")
// LocalRangePriorReadSummarySuffix is the suffix for a range's prior read
// summary.
LocalRangePriorReadSummarySuffix = []byte("rprs")
// LocalRangeVersionSuffix is the suffix for the range version.
LocalRangeVersionSuffix = []byte("rver")
// LocalRangeStatsLegacySuffix is the suffix for range statistics.
LocalRangeStatsLegacySuffix = []byte("stat")
// localTxnSpanGCThresholdSuffix is DEPRECATED and remains to prevent reuse.
localTxnSpanGCThresholdSuffix = []byte("tst-")
// 2. Unreplicated Range-ID keys
//
// localRangeIDUnreplicatedInfix is the post-Range ID specifier for all
// per-range data that is not fully Raft replicated. By appending this
// after the Range ID, these keys will be sorted directly after the local
// replicated keys for the same Range ID, so they can be manipulated either
// together or individually in a single scan.
localRangeIDUnreplicatedInfix = []byte("u")
// LocalRangeTombstoneSuffix is the suffix for the range tombstone.
//
// NB: This suffix was originally named LocalRaftTombstoneSuffix, which is
// why it starts off with "rft" as opposed to "rl".
LocalRangeTombstoneSuffix = []byte("rftb")
// LocalRaftHardStateSuffix is the Suffix for the raft HardState.
LocalRaftHardStateSuffix = []byte("rfth")
// localRaftLastIndexSuffix is DEPRECATED and remains to prevent reuse.
localRaftLastIndexSuffix = []byte("rfti")
// LocalRaftLogSuffix is the suffix for the raft log.
LocalRaftLogSuffix = []byte("rftl")
// LocalRangeLastReplicaGCTimestampSuffix is the suffix for a range's last
// replica GC timestamp (for GC of old replicas).
LocalRangeLastReplicaGCTimestampSuffix = []byte("rlrt")
// localRangeLastVerificationTimestampSuffix is DEPRECATED and remains to
// prevent reuse.
localRangeLastVerificationTimestampSuffix = []byte("rlvt")
// 3. Range local keys
//
// LocalRangePrefix is the prefix identifying per-range data indexed
// by range key (either start key, or some key in the range). The
// key is appended to this prefix, encoded using EncodeBytes. The
// specific sort of per-range metadata is identified by one of the
// suffixes listed below, along with potentially additional encoded
// key info, such as the txn ID in the case of a transaction record.
LocalRangePrefix = roachpb.Key(makeKey(LocalPrefix, roachpb.RKey("k")))
LocalRangeMax = LocalRangePrefix.PrefixEnd()
// LocalRangeProbeSuffix is the suffix for keys for probing.
LocalRangeProbeSuffix = roachpb.RKey("prbe")
// LocalQueueLastProcessedSuffix is the suffix for replica queue state keys.
LocalQueueLastProcessedSuffix = roachpb.RKey("qlpt")
// LocalRangeDescriptorSuffix is the suffix for keys storing
// range descriptors. The value is a struct of type RangeDescriptor.
LocalRangeDescriptorSuffix = roachpb.RKey("rdsc")
// LocalTransactionSuffix specifies the key suffix for
// transaction records. The additional detail is the transaction id.
LocalTransactionSuffix = roachpb.RKey("txn-")
// 4. Store local keys
//
// LocalStorePrefix is the prefix identifying per-store data.
LocalStorePrefix = makeKey(LocalPrefix, roachpb.Key("s"))
// localStoreClusterVersionSuffix stores the cluster-wide version
// information for this store, updated any time the operator
// updates the minimum cluster version.
localStoreClusterVersionSuffix = []byte("cver")
// localStoreGossipSuffix stores gossip bootstrap metadata for this
// store, updated any time new gossip hosts are encountered.
localStoreGossipSuffix = []byte("goss")
// localStoreHLCUpperBoundSuffix stores an upper bound to the wall time used by
// the HLC.
localStoreHLCUpperBoundSuffix = []byte("hlcu")
// localStoreIdentSuffix stores an immutable identifier for this
// store, created when the store is first bootstrapped.
localStoreIdentSuffix = []byte("iden")
// localStoreNodeTombstoneSuffix stores key value pairs that map
// nodeIDs to time of removal from cluster.
localStoreNodeTombstoneSuffix = []byte("ntmb")
// localStoreLastUpSuffix stores the last timestamp that a store's node
// acknowledged that it was still running. This value will be regularly
// refreshed on all stores for a running node; the intention of this value
// is to allow a restarting node to discover approximately how long it has
// been down without needing to retrieve liveness records from the cluster.
localStoreLastUpSuffix = []byte("uptm")
// localRemovedLeakedRaftEntriesSuffix is DEPRECATED and remains to prevent
// reuse.
localRemovedLeakedRaftEntriesSuffix = []byte("dlre")
// localStoreCachedSettingsSuffix stores the cached settings for node.
localStoreCachedSettingsSuffix = []byte("stng")
// LocalStoreCachedSettingsKeyMin is the start of span of possible cached settings keys.
LocalStoreCachedSettingsKeyMin = MakeStoreKey(localStoreCachedSettingsSuffix, nil)
// LocalStoreCachedSettingsKeyMax is the end of span of possible cached settings keys.
LocalStoreCachedSettingsKeyMax = LocalStoreCachedSettingsKeyMin.PrefixEnd()
// LocalStoreUnsafeReplicaRecoverySuffix suffix for record entries put
// when loss of quorum recovery operations are performed offline on the store.
localStoreUnsafeReplicaRecoverySuffix = []byte("loqr")
// LocalStoreUnsafeReplicaRecoveryKeyMin is the start of keyspace used to store
// replica LOQ recovery keys.
LocalStoreUnsafeReplicaRecoveryKeyMin = MakeStoreKey(localStoreUnsafeReplicaRecoverySuffix, nil)
// LocalStoreUnsafeReplicaRecoveryKeyMax is the end of keyspace used to store replica
// LOQ recovery keys.
LocalStoreUnsafeReplicaRecoveryKeyMax = LocalStoreUnsafeReplicaRecoveryKeyMin.PrefixEnd()
// 5. Lock table keys
//
// LocalRangeLockTablePrefix specifies the key prefix for the lock
// table. It is immediately followed by the LockTableSingleKeyInfix,
// and then the key being locked.
//
// The lock strength and txn UUID are not in the part of the key that
// the keys package deals with. They are in the versioned part of the
// key (see EngineKey.Version). This permits the storage engine to use
// bloom filters when searching for all locks for a lockable key.
//
// Different lock strengths may use different value types. The exclusive
// lock strength uses MVCCMetadata as the value type, since it does
// double duty as a reference to a provisional MVCC value.
// TODO(sumeer): remember to adjust this comment when adding locks of
// other strengths, or range locks.
LocalRangeLockTablePrefix = roachpb.Key(makeKey(LocalPrefix, roachpb.RKey("z")))
LockTableSingleKeyInfix = []byte("k")
// LockTableSingleKeyStart is the inclusive start key of the key range
// containing single key locks.
LockTableSingleKeyStart = roachpb.Key(makeKey(LocalRangeLockTablePrefix, LockTableSingleKeyInfix))
// LockTableSingleKeyEnd is the exclusive end key of the key range
// containing single key locks.
LockTableSingleKeyEnd = roachpb.Key(
makeKey(LocalRangeLockTablePrefix, roachpb.Key(LockTableSingleKeyInfix).PrefixEnd()))
// The global keyspace includes the meta{1,2}, system, system tenant SQL
// keys, and non-system tenant SQL keys.
// 1. Meta keys
//
// MetaMin is the start of the range of addressing keys.
MetaMin = Meta1Prefix
// MetaMax is the end of the range of addressing keys.
MetaMax = roachpb.Key{metaMaxByte}
// Meta1Prefix is the first level of key addressing. It is selected such that
// all range addressing records sort before any system tables which they
// might describe. The value is a RangeDescriptor struct.
Meta1Prefix = roachpb.Key{meta1PrefixByte}
// Meta1KeyMax is the end of the range of the first level of key addressing.
// The value is a RangeDescriptor struct.
Meta1KeyMax = roachpb.Key(makeKey(Meta1Prefix, roachpb.RKeyMax))
// Meta2Prefix is the second level of key addressing. The value is a
// RangeDescriptor struct.
Meta2Prefix = roachpb.Key{meta2PrefixByte}
// Meta2KeyMax is the end of the range of the second level of key addressing.
// The value is a RangeDescriptor struct.
Meta2KeyMax = roachpb.Key(makeKey(Meta2Prefix, roachpb.RKeyMax))
// 2. System keys
//
// SystemPrefix indicates the beginning of the key range for
// global, system data which are replicated across the cluster.
SystemPrefix = roachpb.Key{systemPrefixByte}
SystemMax = roachpb.Key{systemMaxByte}
// NodeLivenessPrefix specifies the key prefix for the node liveness
// table. Note that this should sort before the rest of the system
// keyspace in order to limit the number of ranges which must use
// expiration-based range leases instead of the more efficient
// node-liveness epoch-based range leases (see
// https://github.com/cockroachdb/cockroach/blob/master/docs/RFCS/20160210_range_leases.md)
NodeLivenessPrefix = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("\x00liveness-")))
// NodeLivenessKeyMax is the maximum value for any node liveness key.
NodeLivenessKeyMax = NodeLivenessPrefix.PrefixEnd()
//
// BootstrapVersionKey is the key at which clusters bootstrapped with a version
// > 1.0 persist the version at which they were bootstrapped.
BootstrapVersionKey = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("bootstrap-version")))
//
// descIDGenerator is the global descriptor ID generator sequence used for
// table and namespace IDs for the system tenant. All other tenants use a
// SQL sequence for this purpose. See sqlEncoder.DescIDSequenceKey.
descIDGenerator = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("desc-idgen")))
// NodeIDGenerator is the global node ID generator sequence.
NodeIDGenerator = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("node-idgen")))
// RangeIDGenerator is the global range ID generator sequence.
RangeIDGenerator = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("range-idgen")))
// StoreIDGenerator is the global store ID generator sequence.
StoreIDGenerator = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("store-idgen")))
//
// StatusPrefix specifies the key prefix to store all status details.
StatusPrefix = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("status-")))
// StatusNodePrefix stores all status info for nodes.
StatusNodePrefix = roachpb.Key(makeKey(StatusPrefix, roachpb.RKey("node-")))
//
// MigrationPrefix specifies the key prefix to store all migration details.
MigrationPrefix = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("system-version/")))
// MigrationLease is the key that nodes must take a lease on in order to run
// system migrations on the cluster.
MigrationLease = roachpb.Key(makeKey(MigrationPrefix, roachpb.RKey("lease")))
//
// TimeseriesPrefix is the key prefix for all timeseries data.
TimeseriesPrefix = roachpb.Key(makeKey(SystemPrefix, roachpb.RKey("tsd")))
// TimeseriesKeyMax is the maximum value for any timeseries data.
TimeseriesKeyMax = TimeseriesPrefix.PrefixEnd()
// 3. System tenant SQL keys
//
// TODO(nvanbenschoten): Figure out what to do with all of these. At a
// minimum, prefix them all with "System".
// TableDataMin is the start of the range of table data keys.
TableDataMin = SystemSQLCodec.TablePrefix(0)
// TableDataMax is the end of the range of table data keys.
TableDataMax = SystemSQLCodec.TablePrefix(math.MaxUint32).PrefixEnd()
// ScratchRangeMin is a key used in tests to write arbitrary data without
// overlapping with meta, system or tenant ranges.
ScratchRangeMin = TableDataMax
//
// SystemConfigSplitKey is the key to split at immediately prior to the
// system config span. NB: Split keys need to be valid column keys.
// TODO(bdarnell): this should be either roachpb.Key or RKey, not []byte.
SystemConfigSplitKey = []byte(TableDataMin)
// SystemConfigTableDataMax is the end key of system config span.
SystemConfigTableDataMax = SystemSQLCodec.TablePrefix(MaxSystemConfigDescID + 1)
//
// NamespaceTableMin is the start key of system.namespace, which is a system
// table that does not reside in the same range as other system tables.
NamespaceTableMin = SystemSQLCodec.TablePrefix(NamespaceTableID)
// NamespaceTableMax is the end key of system.namespace.
NamespaceTableMax = SystemSQLCodec.TablePrefix(NamespaceTableID + 1)
//
// UserTableDataMin is the start key of user structured data.
UserTableDataMin = SystemSQLCodec.TablePrefix(MinUserDescID)
// 4. Non-system tenant SQL keys
//
// TenantPrefix is the prefix for all non-system tenant keys.
TenantPrefix = roachpb.Key{tenantPrefixByte}
TenantTableDataMin = MakeTenantPrefix(roachpb.MinTenantID)
TenantTableDataMax = MakeTenantPrefix(roachpb.MaxTenantID).PrefixEnd()
)
// Various IDs used by the structured data layer.
// NOTE: these must not change during the lifetime of a cluster.
const (
// MaxSystemConfigDescID is the maximum system descriptor ID that will be
// gossiped as part of the SystemConfig. Be careful adding new descriptors to
// this ID range.
MaxSystemConfigDescID = 10
// MaxReservedDescID is the maximum value of reserved descriptor
// IDs. Reserved IDs are used by namespaces and tables used internally by
// cockroach.
MaxReservedDescID = 49
// MinUserDescID is the first descriptor ID available for user
// structured data.
MinUserDescID = MaxReservedDescID + 1
// MinNonPredefinedUserDescID is the first descriptor ID used by
// user-level objects that are not created automatically on empty
// clusters (default databases).
// Two default databases and two public schemas are created by default using
// 4 ids.
MinNonPredefinedUserDescID = MinUserDescID + 4
// RootNamespaceID is the ID of the root namespace.
RootNamespaceID = 0
// SystemDatabaseID and following are the database/table IDs for objects
// in the system span.
// NOTE: IDs must be <= MaxSystemConfigDescID.
SystemDatabaseID = 1
// DeprecatedNamespaceTableID was the tableID for the system.namespace table
// for pre-20.1 clusters.
DeprecatedNamespaceTableID = 2
DescriptorTableID = 3
UsersTableID = 4
ZonesTableID = 5
SettingsTableID = 6
DescIDSequenceID = 7
TenantsTableID = 8
// IDs for the important columns and indexes in the zones table live here to
// avoid introducing a dependency on sql/sqlbase throughout the codebase.
ZonesTablePrimaryIndexID = 1
ZonesTableConfigColumnID = 2
ZonesTableConfigColFamID = 2
DescriptorTablePrimaryKeyIndexID = 1
DescriptorTableDescriptorColID = 2
DescriptorTableDescriptorColFamID = 2
TenantsTablePrimaryKeyIndexID = 1
SpanConfigurationsTablePrimaryKeyIndexID = 1
// Reserved IDs for other system tables. Note that some of these IDs refer
// to "Ranges" instead of a Table - these IDs are needed to store custom
// configuration for non-table ranges (e.g. Zone Configs).
// NOTE: IDs must be <= MaxReservedDescID.
LeaseTableID = 11
EventLogTableID = 12
RangeEventTableID = 13
UITableID = 14
JobsTableID = 15
MetaRangesID = 16 // pseudo
SystemRangesID = 17 // pseudo
TimeseriesRangesID = 18 // pseudo
WebSessionsTableID = 19
TableStatisticsTableID = 20
LocationsTableID = 21
LivenessRangesID = 22 // pseudo
RoleMembersTableID = 23
CommentsTableID = 24
ReplicationConstraintStatsTableID = 25
ReplicationCriticalLocalitiesTableID = 26
ReplicationStatsTableID = 27
ReportsMetaTableID = 28
// PublicSchemaID refers to old references where Public schemas are
// descriptorless.
// TODO(richardjcai): This should be fully removed in 22.2.
PublicSchemaID = 29 // pseudo
// PublicSchemaIDForBackup is used temporarily to determine cases of
// PublicSchemaID being used for backup.
// We need to keep this around since backups created prior to 22.1 use 29
// as the ID for a virtual public schema. In restores, we look for this 29
// and synthesize a public schema with a descriptor when necessary.
PublicSchemaIDForBackup = 29
// SystemPublicSchemaID represents the ID used for the pseudo public
// schema in the system database.
SystemPublicSchemaID = 29 // pseudo
// New NamespaceTableID for cluster version >= 20.1
// Ensures that NamespaceTable does not get gossiped again
NamespaceTableID = 30
ProtectedTimestampsMetaTableID = 31
ProtectedTimestampsRecordsTableID = 32
RoleOptionsTableID = 33
StatementBundleChunksTableID = 34
StatementDiagnosticsRequestsTableID = 35
StatementDiagnosticsTableID = 36
ScheduledJobsTableID = 37
TenantsRangesID = 38 // pseudo
SqllivenessID = 39
MigrationsID = 40
JoinTokensTableID = 41
StatementStatisticsTableID = 42
TransactionStatisticsTableID = 43
DatabaseRoleSettingsTableID = 44
TenantUsageTableID = 45
SQLInstancesTableID = 46
SpanConfigurationsTableID = 47
// CommentType is type for system.comments
DatabaseCommentType = 0
TableCommentType = 1
ColumnCommentType = 2
IndexCommentType = 3
SchemaCommentType = 4
ConstraintCommentType = 5
)
const (
// SequenceIndexID is the ID of the single index on each special single-column,
// single-row sequence table.
SequenceIndexID = 1
// SequenceColumnFamilyID is the ID of the column family on each special single-column,
// single-row sequence table.
SequenceColumnFamilyID = 0
)
// PseudoTableIDs is the list of ids from above that are not real tables (i.e.
// there's no table descriptor). They're grouped here because the cluster
// bootstrap process needs to create splits for them; splits for the tables
// happen separately.
var PseudoTableIDs = []uint32{
MetaRangesID,
SystemRangesID,
TimeseriesRangesID,
LivenessRangesID,
PublicSchemaID,
TenantsRangesID,
}
// MaxPseudoTableID is the largest ID in PseudoTableIDs.
var MaxPseudoTableID = func() uint32 {
var max uint32
for _, id := range PseudoTableIDs {
if max < id {
max = id
}
}
return max
}()