-
Notifications
You must be signed in to change notification settings - Fork 3.8k
/
virtual_schema.go
1020 lines (923 loc) · 34.9 KB
/
virtual_schema.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
// Copyright 2016 The Cockroach Authors.
//
// Use of this software is governed by the Business Source License
// included in the file licenses/BSL.txt.
//
// As of the Change Date specified in that file, in accordance with
// the Business Source License, use of this software will be governed
// by the Apache License, Version 2.0, included in the file
// licenses/APL.txt.
package sql
import (
"context"
"fmt"
"math"
"sort"
"time"
"github.com/cockroachdb/cockroach/pkg/security/username"
"github.com/cockroachdb/cockroach/pkg/settings/cluster"
"github.com/cockroachdb/cockroach/pkg/sql/catalog"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/catpb"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/catsessiondata"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/colinfo"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/descpb"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/descs"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/schemadesc"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/schemaexpr"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/tabledesc"
"github.com/cockroachdb/cockroach/pkg/sql/catalog/typedesc"
"github.com/cockroachdb/cockroach/pkg/sql/opt/constraint"
"github.com/cockroachdb/cockroach/pkg/sql/parser"
"github.com/cockroachdb/cockroach/pkg/sql/pgwire/pgcode"
"github.com/cockroachdb/cockroach/pkg/sql/pgwire/pgerror"
"github.com/cockroachdb/cockroach/pkg/sql/privilege"
"github.com/cockroachdb/cockroach/pkg/sql/sem/catconstants"
"github.com/cockroachdb/cockroach/pkg/sql/sem/eval"
"github.com/cockroachdb/cockroach/pkg/sql/sem/tree"
"github.com/cockroachdb/cockroach/pkg/sql/sessiondata"
"github.com/cockroachdb/cockroach/pkg/sql/sqlerrors"
"github.com/cockroachdb/cockroach/pkg/sql/sqltelemetry"
"github.com/cockroachdb/cockroach/pkg/util/errorutil/unimplemented"
"github.com/cockroachdb/cockroach/pkg/util/hlc"
"github.com/cockroachdb/cockroach/pkg/util/iterutil"
"github.com/cockroachdb/cockroach/pkg/util/stop"
"github.com/cockroachdb/errors"
)
const virtualSchemaNotImplementedMessage = "virtual schema table not implemented: %s.%s"
//
// Programmer interface to define virtual schemas.
//
// virtualSchema represents a database with a set of virtual tables. Virtual
// tables differ from standard tables in that they are not persisted to storage,
// and instead their contents are populated whenever they are queried.
//
// The virtual database and its virtual tables also differ from standard databases
// and tables in that their descriptors are not distributed, but instead live statically
// in code. This means that they are accessed separately from standard descriptors.
type virtualSchema struct {
name string
undefinedTables map[string]struct{}
tableDefs map[descpb.ID]virtualSchemaDef
tableValidator func(*descpb.TableDescriptor) error // optional
// Some virtual tables can be used if there is no current database set; others can't.
validWithNoDatabaseContext bool
// Some virtual schemas (like pg_catalog) contain types that we can resolve.
containsTypes bool
}
// virtualSchemaDef represents the interface of a table definition within a virtualSchema.
type virtualSchemaDef interface {
getSchema() string
initVirtualTableDesc(
ctx context.Context, st *cluster.Settings, sc catalog.SchemaDescriptor, id descpb.ID,
) (descpb.TableDescriptor, error)
getComment() string
isUnimplemented() bool
}
type virtualIndex struct {
// populate populates the table given the constraint. matched is true if any
// rows were generated.
// unwrappedConstraint is unwrapped and never tree.DNull.
populate func(
ctx context.Context,
unwrappedConstraint tree.Datum,
p *planner,
db catalog.DatabaseDescriptor,
addRow func(...tree.Datum) error,
) (matched bool, err error)
// incomplete is true if the virtual index isn't able to satisfy all constraints.
// For example, the pg_class table contains both indexes and tables. Tables
// can be looked up via a virtual index, since we can look up their descriptor
// by their ID directly. But indexes can't - they're hashed identifiers with
// no actual index. So we mark this index as incomplete, and if we get no match
// during populate, we'll fall back on populating the entire table.
incomplete bool
}
// virtualSchemaTable represents a table within a virtualSchema.
type virtualSchemaTable struct {
// Exactly one of the populate and generator fields should be defined for
// each virtualSchemaTable.
schema string
// comment represents comment of virtual schema table.
comment string
// populate, if non-nil, is a function that is used when creating a
// valuesNode. This function eagerly loads every row of the virtual table
// during initialization of the valuesNode.
populate func(ctx context.Context, p *planner, db catalog.DatabaseDescriptor, addRow func(...tree.Datum) error) error
// indexes, if non empty, is a slice of populate methods that also take a
// constraint, only generating rows that match the constraint. The order of
// indexes must match the order of the index definitions in the virtual table's
// schema.
indexes []virtualIndex
// generator, if non-nil, is a function that is used when creating a
// virtualTableNode. This function returns a virtualTableGenerator function
// which generates the next row of the virtual table when called.
generator func(ctx context.Context, p *planner, db catalog.DatabaseDescriptor, stopper *stop.Stopper) (virtualTableGenerator, cleanupFunc, error)
// unimplemented indicates that we do not yet implement the contents of this
// table. If the stub_catalog_tables session variable is enabled, the table
// will be queryable but return no rows. Otherwise querying the table will
// return an unimplemented error.
unimplemented bool
// resultColumns is optional; if present, it will be checked for coherency
// with schema.
resultColumns colinfo.ResultColumns
}
// virtualSchemaView represents a view within a virtualSchema
type virtualSchemaView struct {
schema string
resultColumns colinfo.ResultColumns
// comment represents comment of virtual schema view.
comment string
}
// getSchema is part of the virtualSchemaDef interface.
func (t virtualSchemaTable) getSchema() string {
return t.schema
}
// initVirtualTableDesc is part of the virtualSchemaDef interface.
func (t virtualSchemaTable) initVirtualTableDesc(
ctx context.Context, st *cluster.Settings, sc catalog.SchemaDescriptor, id descpb.ID,
) (descpb.TableDescriptor, error) {
stmt, err := parser.ParseOne(t.schema)
if err != nil {
return descpb.TableDescriptor{}, err
}
create := stmt.AST.(*tree.CreateTable)
var firstColDef *tree.ColumnTableDef
for _, def := range create.Defs {
if d, ok := def.(*tree.ColumnTableDef); ok {
if d.HasDefaultExpr() {
return descpb.TableDescriptor{},
errors.Errorf("virtual tables are not allowed to use default exprs "+
"because bootstrapping: %s:%s", &create.Table, d.Name)
}
if firstColDef == nil {
firstColDef = d
}
}
if _, ok := def.(*tree.UniqueConstraintTableDef); ok {
return descpb.TableDescriptor{},
errors.Errorf("virtual tables are not allowed to have unique constraints")
}
}
if firstColDef == nil {
return descpb.TableDescriptor{},
errors.Errorf("can't have empty virtual tables")
}
// Virtual tables never use SERIAL so we need not process SERIAL
// types here.
semaCtx := tree.MakeSemaContext()
mutDesc, err := NewTableDesc(
ctx,
nil, /* txn */
nil, /* vs */
st,
create,
nil,
sc,
id,
nil, /* regionConfig */
startTime, /* creationTime */
catpb.NewPrivilegeDescriptor(
username.PublicRoleName(),
privilege.List{privilege.SELECT},
privilege.List{},
username.NodeUserName(),
),
nil, /* affected */
&semaCtx, /* semaCtx */
// We explicitly pass in a half-baked EvalContext because we don't need to
// evaluate any expressions to initialize virtual tables. We do need to
// pass in the cluster settings to make sure that functions can properly
// evaluate version gates, though.
&eval.Context{Settings: st}, /* evalCtx */
&sessiondata.SessionData{}, /* sessionData */
tree.PersistencePermanent,
)
if err != nil {
err = errors.Wrapf(err, "initVirtualDesc problem with schema: \n%s", t.schema)
return descpb.TableDescriptor{}, err
}
if t.resultColumns != nil {
if len(mutDesc.Columns) != len(t.resultColumns) {
return descpb.TableDescriptor{}, errors.AssertionFailedf(
"virtual table %s.%s declares incorrect number of columns: %d vs %d",
sc.GetName(), mutDesc.GetName(),
len(mutDesc.Columns), len(t.resultColumns))
}
for i := range mutDesc.Columns {
if mutDesc.Columns[i].Name != t.resultColumns[i].Name ||
mutDesc.Columns[i].Hidden != t.resultColumns[i].Hidden ||
mutDesc.Columns[i].Type.String() != t.resultColumns[i].Typ.String() {
return descpb.TableDescriptor{}, errors.AssertionFailedf(
"virtual table %s.%s declares incorrect column metadata: %#v vs %#v",
sc.GetName(), mutDesc.GetName(),
mutDesc.Columns[i], t.resultColumns[i])
}
}
}
if t.generator != nil {
for _, idx := range t.indexes {
if idx.incomplete {
return descpb.TableDescriptor{}, errors.AssertionFailedf(
"virtual table %s.%s contains an incomplete index and a generator will"+
" never use the index", sc.GetName(), mutDesc.GetName(),
)
}
}
}
for _, index := range mutDesc.PublicNonPrimaryIndexes() {
if index.NumKeyColumns() > 1 {
panic("we don't know how to deal with virtual composite indexes yet")
}
idx := index.IndexDescDeepCopy()
idx.StoreColumnNames, idx.StoreColumnIDs = nil, nil
publicColumns := mutDesc.PublicColumns()
presentInIndex := catalog.MakeTableColSet(idx.KeyColumnIDs...)
for _, col := range publicColumns {
if col.IsVirtual() || presentInIndex.Contains(col.GetID()) {
continue
}
idx.StoreColumnIDs = append(idx.StoreColumnIDs, col.GetID())
idx.StoreColumnNames = append(idx.StoreColumnNames, col.GetName())
}
mutDesc.SetPublicNonPrimaryIndex(index.Ordinal(), idx)
}
return mutDesc.TableDescriptor, nil
}
// getComment is part of the virtualSchemaDef interface.
func (t virtualSchemaTable) getComment() string {
return t.comment
}
// getIndex returns the virtual index with the input ID.
func (t virtualSchemaTable) getIndex(id descpb.IndexID) *virtualIndex {
// Subtract 2 from the index id to get the ordinal in def.indexes, since
// the index with ID 1 is the "primary" index defined by def.populate.
return &t.indexes[id-2]
}
// unimplemented retrieves whether the virtualSchemaDef is implemented or not.
func (t virtualSchemaTable) isUnimplemented() bool {
return t.unimplemented
}
// preferIndexOverGenerator defines the cases in which we are able to use a
// virtual index's populate function when we have a virtual table defined with
// a generator function instead of a populate function. Specifically, use of a
// virtual index is supported when we have only single key constraints, and are
// not using a partial index, and therefore do not need to fallback on an
// undefined populate function.
func (t virtualSchemaTable) preferIndexOverGenerator(
p *planner, index catalog.Index, idxConstraint *constraint.Constraint,
) bool {
if idxConstraint == nil || idxConstraint.IsUnconstrained() {
return false
}
if index.GetID() == 1 {
return false
}
virtualIdx := t.getIndex(index.GetID())
if virtualIdx.incomplete {
return false
}
for i := 0; i < idxConstraint.Spans.Count(); i++ {
constraintSpan := idxConstraint.Spans.Get(i)
if !constraintSpan.HasSingleKey(p.EvalContext()) {
return false
}
}
return true
}
// getSchema is part of the virtualSchemaDef interface.
func (v virtualSchemaView) getSchema() string {
return v.schema
}
// initVirtualTableDesc is part of the virtualSchemaDef interface.
func (v virtualSchemaView) initVirtualTableDesc(
ctx context.Context, st *cluster.Settings, sc catalog.SchemaDescriptor, id descpb.ID,
) (descpb.TableDescriptor, error) {
stmt, err := parser.ParseOne(v.schema)
if err != nil {
return descpb.TableDescriptor{}, err
}
create := stmt.AST.(*tree.CreateView)
columns := v.resultColumns
if len(create.ColumnNames) != 0 {
columns = overrideColumnNames(columns, create.ColumnNames)
}
mutDesc, err := makeViewTableDesc(
ctx,
create.Name.Table(),
tree.AsStringWithFlags(create.AsSource, tree.FmtParsable),
0,
sc.GetID(),
id,
columns,
startTime,
catpb.NewPrivilegeDescriptor(
username.PublicRoleName(),
privilege.List{privilege.SELECT},
privilege.List{},
username.NodeUserName(),
),
nil, // semaCtx
// We explicitly pass in a half-baked EvalContext because we don't need to
// evaluate any expressions to initialize virtual tables. We do need to
// pass in the cluster settings to make sure that functions can properly
// evaluate version gates, though.
&eval.Context{Settings: st}, /* evalCtx */
st,
tree.PersistencePermanent,
false, // isMultiRegion
nil, // sc
)
return mutDesc.TableDescriptor, err
}
// getComment is part of the virtualSchemaDef interface.
func (v virtualSchemaView) getComment() string {
return v.comment
}
// isUnimplemented is part of the virtualSchemaDef interface.
func (v virtualSchemaView) isUnimplemented() bool {
return false
}
// virtualSchemas holds a slice of statically registered virtualSchema objects.
//
// When adding a new virtualSchema, define a virtualSchema in a separate file, and
// add that object to this slice.
var virtualSchemas = map[descpb.ID]virtualSchema{
catconstants.InformationSchemaID: informationSchema,
catconstants.PgCatalogID: pgCatalog,
catconstants.CrdbInternalID: crdbInternal,
catconstants.PgExtensionSchemaID: pgExtension,
}
var startTime = hlc.Timestamp{
WallTime: time.Date(2000, time.January, 1, 0, 0, 0, 0, time.UTC).UnixNano(),
}
//
// SQL-layer interface to work with virtual schemas.
//
// VirtualSchemaHolder is a type used to provide convenient access to virtual
// database and table descriptors. VirtualSchemaHolder, virtualSchemaEntry,
// and virtualDefEntry make up the generated data structure which the
// virtualSchemas slice is mapped to. Because of this, they should not be
// created directly, but instead will be populated in a post-startup hook
// on an Executor.
type VirtualSchemaHolder struct {
schemasByName map[string]*virtualSchemaEntry
schemasByID map[descpb.ID]*virtualSchemaEntry
defsByID map[descpb.ID]*virtualDefEntry
orderedNames []string
}
var _ VirtualTabler = (*VirtualSchemaHolder)(nil)
// GetVirtualSchema makes VirtualSchemaHolder implement catalog.VirtualSchemas.
func (vs *VirtualSchemaHolder) GetVirtualSchema(schemaName string) (catalog.VirtualSchema, bool) {
sc, ok := vs.schemasByName[schemaName]
return sc, ok
}
// GetVirtualSchemaByID makes VirtualSchemaHolder implement catalog.VirtualSchemas.
func (vs *VirtualSchemaHolder) GetVirtualSchemaByID(id descpb.ID) (catalog.VirtualSchema, bool) {
sc, ok := vs.schemasByID[id]
return sc, ok
}
// GetVirtualObjectByID makes VirtualSchemaHolder implement catalog.VirtualSchemas.
func (vs *VirtualSchemaHolder) GetVirtualObjectByID(id descpb.ID) (catalog.VirtualObject, bool) {
entry, ok := vs.defsByID[id]
if !ok {
return nil, false
}
return entry, true
}
// Visit makes VirtualSchemaHolder implement catalog.VirtualSchemas.
func (vs *VirtualSchemaHolder) Visit(fn func(desc catalog.Descriptor, comment string) error) error {
for _, sc := range vs.schemasByID {
if err := fn(sc.desc, "" /* comment */); err != nil {
return iterutil.Map(err)
}
for _, def := range sc.defs {
if err := fn(def.desc, def.comment); err != nil {
return iterutil.Map(err)
}
}
}
return nil
}
var _ catalog.VirtualSchemas = (*VirtualSchemaHolder)(nil)
type virtualSchemaEntry struct {
desc catalog.SchemaDescriptor
defs map[string]*virtualDefEntry
orderedDefNames []string
undefinedTables map[string]struct{}
containsTypes bool
}
func (v *virtualSchemaEntry) Desc() catalog.SchemaDescriptor {
return v.desc
}
func (v *virtualSchemaEntry) NumTables() int {
return len(v.defs)
}
func (v *virtualSchemaEntry) VisitTables(f func(object catalog.VirtualObject)) {
for _, name := range v.orderedDefNames {
f(v.defs[name])
}
}
func (v *virtualSchemaEntry) GetObjectByName(
name string, kind tree.DesiredObjectKind,
) (catalog.VirtualObject, error) {
switch kind {
case tree.TypeObject:
// Currently, we don't allow creation of types in virtual schemas, so
// the only types present in the virtual schemas that have types (i.e.
// pg_catalog) are types that are known at parse time or implicit record
// types for each table. So, first attempt to
// parse the input object as a statically known type. Note that an
// invalid input type like "notatype" will be parsed successfully as
// a ResolvableTypeReference, so the error here does not need to be
// intercepted and inspected.
if v.containsTypes {
typRef, err := parser.GetTypeReferenceFromName(tree.Name(name))
if err != nil {
return nil, err
}
// If the parsed reference is actually a statically known type, then
// we can return it. We return a simple wrapping of this type as
// TypeDescriptor that represents an alias of the result type.
typ, ok := tree.GetStaticallyKnownType(typRef)
if ok {
return &virtualTypeEntry{
desc: typedesc.MakeSimpleAlias(typ, catconstants.PgCatalogID),
}, nil
}
}
// If the type could not be found statically, then search for a table with
// this name so the implicit record type can be used.
fallthrough
case tree.TableObject:
if def, ok := v.defs[name]; ok {
return def, nil
}
if _, ok := v.undefinedTables[name]; ok {
return nil, newUnimplementedVirtualTableError(v.desc.GetName(), name)
}
}
return nil, nil
}
type virtualDefEntry struct {
virtualDef virtualSchemaDef
desc catalog.TableDescriptor
comment string
validWithNoDatabaseContext bool
unimplemented bool
}
func (e *virtualDefEntry) Desc() catalog.Descriptor {
return e.desc
}
func canQueryVirtualTable(evalCtx *eval.Context, e *virtualDefEntry) bool {
return !e.unimplemented ||
evalCtx == nil ||
evalCtx.SessionData() == nil ||
evalCtx.SessionData().StubCatalogTablesEnabled
}
type virtualTypeEntry struct {
desc catalog.TypeDescriptor
}
func (e *virtualTypeEntry) Desc() catalog.Descriptor {
return e.desc
}
type virtualTableConstructor func(context.Context, *planner, string) (planNode, error)
var errInvalidDbPrefix = errors.WithHint(
pgerror.New(pgcode.UndefinedObject,
"cannot access virtual schema in anonymous database"),
"verify that the current database is set")
func newInvalidVirtualSchemaError() error {
return errors.AssertionFailedf("virtualSchema cannot have both the populate and generator functions defined")
}
func newInvalidVirtualDefEntryError() error {
return errors.AssertionFailedf("virtualDefEntry.virtualDef must be a virtualSchemaTable")
}
func (e *virtualDefEntry) validateRow(datums tree.Datums, columns colinfo.ResultColumns) error {
if r, c := len(datums), len(columns); r != c {
return errors.AssertionFailedf("datum row count and column count differ: %d vs %d", r, c)
}
for i := range columns {
col := &columns[i]
datum := datums[i]
if datum == tree.DNull {
if !e.desc.PublicColumns()[i].IsNullable() {
return errors.AssertionFailedf("column %s.%s not nullable, but found NULL value",
e.desc.GetName(), col.Name)
}
} else if !datum.ResolvedType().Equivalent(col.Typ) {
return errors.AssertionFailedf("datum column %q expected to be type %s; found type %s",
col.Name, col.Typ, datum.ResolvedType())
}
}
return nil
}
// getPlanInfo returns the column metadata and a constructor for a new
// valuesNode for the virtual table. We use deferred construction here
// so as to avoid populating a RowContainer during query preparation,
// where we can't guarantee it will be Close()d in case of error.
func (e *virtualDefEntry) getPlanInfo(
table catalog.TableDescriptor,
index catalog.Index,
idxConstraint *constraint.Constraint,
stopper *stop.Stopper,
) (colinfo.ResultColumns, virtualTableConstructor) {
var columns colinfo.ResultColumns
for _, col := range e.desc.PublicColumns() {
columns = append(columns, colinfo.ResultColumn{
Name: col.GetName(),
Typ: col.GetType(),
TableID: table.GetID(),
PGAttributeNum: uint32(col.GetPGAttributeNum()),
})
}
constructor := func(ctx context.Context, p *planner, dbName string) (planNode, error) {
var dbDesc catalog.DatabaseDescriptor
var err error
if dbName != "" {
dbDesc, err = p.byNameGetterBuilder().Get().Database(ctx, dbName)
if err != nil {
return nil, err
}
} else {
if !e.validWithNoDatabaseContext {
return nil, errInvalidDbPrefix
}
}
switch def := e.virtualDef.(type) {
case virtualSchemaTable:
if def.generator != nil && def.populate != nil {
return nil, newInvalidVirtualSchemaError()
}
if def.generator != nil && !def.preferIndexOverGenerator(p, index, idxConstraint) {
next, cleanup, err := def.generator(ctx, p, dbDesc, stopper)
if err != nil {
return nil, err
}
if index != nil && index.IsPartial() {
if next, err = e.wrapVirtualTableGeneratorWithPartialIndexPredicate(
ctx, p, index, next,
); err != nil {
return nil, err
}
}
return p.newVirtualTableNode(columns, next, cleanup), nil
}
constrainedScan := idxConstraint != nil && !idxConstraint.IsUnconstrained()
if !constrainedScan {
var filter func(tree.Datums) (bool, error)
if index != nil && index.IsPartial() {
if filter, err = e.getIndexPredicateFilter(ctx, p, index); err != nil {
return nil, err
}
}
generator, cleanup, setupError := setupGenerator(ctx, func(ctx context.Context, pusher rowPusher) error {
return def.populate(ctx, p, dbDesc, func(row ...tree.Datum) error {
if err := e.validateRow(row, columns); err != nil {
return err
}
if filter != nil {
if matched, err := filter(row); err != nil || !matched {
return err
}
}
return pusher.pushRow(row...)
})
}, stopper)
if setupError != nil {
return nil, setupError
}
return p.newVirtualTableNode(columns, generator, cleanup), nil
}
// We are now dealing with a constrained virtual index scan.
if index.GetID() == 1 {
return nil, errors.AssertionFailedf(
"programming error: can't constrain scan on primary virtual index of table %s", e.desc.GetName())
}
// Figure out the ordinal position of the column that we're filtering on.
columnIdxMap := catalog.ColumnIDToOrdinalMap(table.PublicColumns())
indexKeyDatums := make([]tree.Datum, index.NumKeyColumns())
generator, cleanup, setupError := setupGenerator(ctx, e.makeConstrainedRowsGenerator(
p, dbDesc, index, indexKeyDatums, columnIdxMap, idxConstraint, columns), stopper)
if setupError != nil {
return nil, setupError
}
return p.newVirtualTableNode(columns, generator, cleanup), nil
default:
return nil, newInvalidVirtualDefEntryError()
}
}
return columns, constructor
}
// wrapVirtualTableGeneratorWithPartialIndexPredicate will filter the
// virtualTableGenerator rows which do not match the partial index predicate.
// The passed index must exist and be partial.
func (e *virtualDefEntry) wrapVirtualTableGeneratorWithPartialIndexPredicate(
ctx context.Context, p *planner, index catalog.Index, src virtualTableGenerator,
) (virtualTableGenerator, error) {
partialFilter, err := e.getIndexPredicateFilter(ctx, p, index)
if err != nil {
return nil, err
}
return func() (tree.Datums, error) {
for {
datums, err := src()
if err != nil {
return nil, err
}
if datums == nil {
return nil, nil
}
matched, err := partialFilter(datums)
if err != nil {
return nil, err
}
if matched {
return datums, nil
}
}
}, nil
}
// makeConstrainedRowsGenerator returns a generator function that can be invoked
// to push all rows from this virtual table that satisfy the input index
// constraint to a row pusher that's supplied to the generator function.
func (e *virtualDefEntry) makeConstrainedRowsGenerator(
p *planner,
dbDesc catalog.DatabaseDescriptor,
index catalog.Index,
indexKeyDatums []tree.Datum,
columnIdxMap catalog.TableColMap,
idxConstraint *constraint.Constraint,
columns colinfo.ResultColumns,
) func(ctx context.Context, pusher rowPusher) error {
def := e.virtualDef.(virtualSchemaTable)
return func(ctx context.Context, pusher rowPusher) error {
var span constraint.Span
var partialIndexPredicate func(datums tree.Datums) (matched bool, _ error)
addRowIfPassesFilter := func(idxConstraint *constraint.Constraint) func(datums ...tree.Datum) error {
return func(datums ...tree.Datum) error {
for i := 0; i < index.NumKeyColumns(); i++ {
id := index.GetKeyColumnID(i)
indexKeyDatums[i] = datums[columnIdxMap.GetDefault(id)]
}
// Construct a single key span out of the current row, so that
// we can test it for containment within the constraint span of the
// filter that we're applying. The results of this containment check
// will tell us whether or not to let the current row pass the filter.
key := constraint.MakeCompositeKey(indexKeyDatums...)
span.Init(key, constraint.IncludeBoundary, key, constraint.IncludeBoundary)
if !idxConstraint.ContainsSpan(p.EvalContext(), &span) {
return nil
}
if err := e.validateRow(datums, columns); err != nil {
return err
}
if partialIndexPredicate != nil {
matched, err := partialIndexPredicate(datums)
if err != nil {
return err
}
if !matched {
return nil
}
}
return pusher.pushRow(datums...)
}
}
// We have a virtual index with a constraint. Run the constrained
// populate routine for every span. If for some reason we can't use the
// index for a given span, we exit the loop early and run a "full scan"
// over the virtual table, filtering the output using the remaining
// spans.
var currentSpan int
for ; currentSpan < idxConstraint.Spans.Count(); currentSpan++ {
span := idxConstraint.Spans.Get(currentSpan)
if span.StartKey().Length() > 1 {
return errors.AssertionFailedf(
"programming error: can't push down composite constraints into vtables")
}
if !span.HasSingleKey(p.EvalContext()) {
// No hope - we can't deal with range scans on virtual indexes.
break
}
constraintDatum := span.StartKey().Value(0)
unwrappedConstraint := eval.UnwrapDatum(ctx, p.EvalContext(), constraintDatum)
virtualIndex := def.getIndex(index.GetID())
// NULL constraint will not match any row.
matched := unwrappedConstraint != tree.DNull
if matched {
// For each span, run the index's populate method, constrained to the
// constraint span's value.
var err error
matched, err = virtualIndex.populate(ctx, unwrappedConstraint, p, dbDesc,
addRowIfPassesFilter(idxConstraint))
if err != nil {
return err
}
}
if !matched && virtualIndex.incomplete {
// If no row was matched, and the index was incomplete, we have no choice
// but to populate the entire table and search through it.
break
}
}
if currentSpan == idxConstraint.Spans.Count() {
// We successfully processed all constraints, so we can leave now.
return nil
}
// Fall back to a full scan of the table, using the remaining filters
// that weren't able to be used as constraints.
newConstraint := *idxConstraint
newConstraint.Spans = constraint.Spans{}
nSpans := idxConstraint.Spans.Count() - currentSpan
newConstraint.Spans.Alloc(nSpans)
for ; currentSpan < idxConstraint.Spans.Count(); currentSpan++ {
newConstraint.Spans.Append(idxConstraint.Spans.Get(currentSpan))
}
// If the index that was chosen but not used was a partial index, we need
// to make sure we apply the same predicate to all rows of the primary
// index.
if index != nil && index.IsPartial() {
var err error
partialIndexPredicate, err = e.getIndexPredicateFilter(ctx, p, index)
if err != nil {
return err
}
}
// NB: If we allow virtualSchemaTables with generator to perform a constrained scan,
// we then need to ensure that we don't call populate without checking, as it may be nil.
if def.populate == nil {
return errors.AssertionFailedf(
"programming error: can't fall back to unconstrained scan on generated vtables")
}
return def.populate(ctx, p, dbDesc, addRowIfPassesFilter(&newConstraint))
}
}
// getIndexPredicateFilter returns a function which can be used to filter
// rows of a virtual table which do not match the corresponding index predicate.
// The index must be non-nil and partial. We need this because there are cases
// the optimizer will choose to scan a virtual index but the index cannot be
// used to serve the query. Instead, we need to scan the primary index and then
// constrain it as though the partial index were scanned.
func (e *virtualDefEntry) getIndexPredicateFilter(
ctx context.Context, p *planner, index catalog.Index,
) (func(datums tree.Datums) (matched bool, _ error), error) {
if index == nil || !index.IsPartial() {
return nil, errors.AssertionFailedf("cannot construct filter for a non-partial index %v", index)
}
expr, err := schemaexpr.MakePartialIndexExpr(ctx, e.desc, index, p.EvalContext(), p.SemaCtx())
if err != nil {
return nil, errors.NewAssertionErrorWithWrappedErrf(err, "failed to construct partial index constraints")
}
publicColumns := e.desc.PublicColumns()
r := schemaexpr.RowIndexedVarContainer{
Cols: publicColumns,
}
for i, c := range publicColumns {
r.Mapping.Set(c.GetID(), i)
}
return func(datums tree.Datums) (matched bool, _ error) {
r.CurSourceRow = datums
p.EvalContext().PushIVarContainer(&r)
defer p.EvalContext().PopIVarContainer()
got, err := eval.Expr(ctx, p.EvalContext(), expr)
if err != nil {
return false, err
}
if got == tree.DNull {
return false, nil
}
return bool(tree.MustBeDBool(got)), nil
}, nil
}
// NewVirtualSchemaHolder creates a new VirtualSchemaHolder.
func NewVirtualSchemaHolder(
ctx context.Context, st *cluster.Settings,
) (*VirtualSchemaHolder, error) {
vs := &VirtualSchemaHolder{
schemasByName: make(map[string]*virtualSchemaEntry, len(virtualSchemas)),
schemasByID: make(map[descpb.ID]*virtualSchemaEntry, len(virtualSchemas)),
orderedNames: make([]string, len(virtualSchemas)),
defsByID: make(map[descpb.ID]*virtualDefEntry, math.MaxUint32-catconstants.MinVirtualID),
}
order := 0
for schemaID, schema := range virtualSchemas {
scDesc, ok := schemadesc.GetVirtualSchemaByID(schemaID)
if !ok {
return nil, errors.AssertionFailedf("failed to find virtual schema %d (%s)", schemaID, schema.name)
}
if scDesc.GetName() != schema.name {
return nil, errors.AssertionFailedf("schema name mismatch for virtual schema %d: expected %s, found %s",
schemaID, schema.name, scDesc.GetName())
}
defs := make(map[string]*virtualDefEntry, len(schema.tableDefs))
orderedDefNames := make([]string, 0, len(schema.tableDefs))
for id, def := range schema.tableDefs {
tableDesc, err := def.initVirtualTableDesc(ctx, st, scDesc, id)
if err != nil {
return nil, errors.NewAssertionErrorWithWrappedErrf(err,
"failed to initialize %s", errors.Safe(def.getSchema()))
}
if schema.tableValidator != nil {
if err := schema.tableValidator(&tableDesc); err != nil {
return nil, errors.NewAssertionErrorWithWrappedErrf(err, "programmer error")
}
}
td := tabledesc.NewBuilder(&tableDesc).BuildImmutableTable()
version := st.Version.ActiveVersionOrEmpty(ctx)
dvmp := catsessiondata.NewDescriptorSessionDataProvider(nil /* sd */)
if err := descs.ValidateSelf(td, version, dvmp); err != nil {
return nil, errors.NewAssertionErrorWithWrappedErrf(err,
"failed to validate virtual table %s: programmer error", errors.Safe(td.GetName()))
}
entry := &virtualDefEntry{
virtualDef: def,
desc: td,
validWithNoDatabaseContext: schema.validWithNoDatabaseContext,
comment: def.getComment(),
unimplemented: def.isUnimplemented(),
}
defs[tableDesc.Name] = entry
vs.defsByID[tableDesc.ID] = entry
orderedDefNames = append(orderedDefNames, tableDesc.Name)
}
sort.Strings(orderedDefNames)
vse := &virtualSchemaEntry{
desc: scDesc,
defs: defs,
orderedDefNames: orderedDefNames,
undefinedTables: schema.undefinedTables,
containsTypes: schema.containsTypes,
}
vs.schemasByName[scDesc.GetName()] = vse
vs.schemasByID[scDesc.GetID()] = vse
vs.orderedNames[order] = scDesc.GetName()
order++
}
sort.Strings(vs.orderedNames)
return vs, nil
}
func newUnimplementedVirtualTableError(schema, tableName string) error {
return unimplemented.Newf(
fmt.Sprintf("%s.%s", schema, tableName),
virtualSchemaNotImplementedMessage,
schema,
tableName,
)
}
// getEntries is part of the VirtualTabler interface.
func (vs *VirtualSchemaHolder) getSchemas() map[string]*virtualSchemaEntry {
return vs.schemasByName
}
// getSchemaNames is part of the VirtualTabler interface.
func (vs *VirtualSchemaHolder) getSchemaNames() []string {
return vs.orderedNames
}
// getVirtualSchemaEntry retrieves a virtual schema entry given a database name.
// getVirtualSchemaEntry is part of the VirtualTabler interface.
func (vs *VirtualSchemaHolder) getVirtualSchemaEntry(name string) (*virtualSchemaEntry, bool) {
e, ok := vs.schemasByName[name]
return e, ok
}
// getVirtualTableEntry checks if the provided name matches a virtual database/table
// pair. The function will return the table's virtual table entry if the name matches
// a specific table. It will return an error if the name references a virtual database
// but the table is non-existent.
// getVirtualTableEntry is part of the VirtualTabler interface.
func (vs *VirtualSchemaHolder) getVirtualTableEntry(tn *tree.TableName) (*virtualDefEntry, error) {
if db, ok := vs.getVirtualSchemaEntry(tn.Schema()); ok {
tableName := tn.Table()
if t, ok := db.defs[tableName]; ok {
sqltelemetry.IncrementGetVirtualTableEntry(tn.Schema(), tableName)
return t, nil
}
if _, ok := db.undefinedTables[tableName]; ok {
return nil, unimplemented.NewWithIssueDetailf(
8675,
fmt.Sprintf("%s.%s", tn.Schema(), tableName),
virtualSchemaNotImplementedMessage,
tn.Schema(),
tableName,
)
}
return nil, sqlerrors.NewUndefinedRelationError(tn)
}
return nil, nil
}