Skip to content

Commit

Permalink
sql: fix left semi and left anti virtual lookup joins
Browse files Browse the repository at this point in the history
This commit fixes the execution of the left semi and left anti virtual
lookup joins. The bug was that we forgot to project away the looked up
columns (coming from the "right" side) which could then lead to wrong
columns being used higher up the tree. The bug was introduced during
22.1 release cycle where we added the optimizer support for generating
plans that could contain left semi and left anti virtual lookup joins.
This commit fixes that issue as well as the output columns of such joins
(I'm not sure whether there is a user facing impact of having incorrect
"output columns").

Additionally, this commit fixes the execution of these virtual lookup
joins to correctly return the input row only once. Previously, for left
anti joins we'd be producing an output row if there was a match (which
is wrong), and for both left semi and left anti we would emit an output
row every time there was a match (but this should be done only once).
(Although I'm not sure whether it is possible for virtual indexes to
result in multiple looked up rows.)

Also, as a minor simplification this commit makes it so that the output
rows are not added into the row container for left semi and left anti
and the container is not instantiated at all.

Release note (bug fix): CockroachDB previously could incorrectly
evaluate queries that performed left semi and left anti "virtual lookup"
joins on tables in `pg_catalog` or `information_schema`. These join types
can be planned when a subquery is used inside of a filter condition. The
bug was introduced in 22.1.0 and is now fixed.
  • Loading branch information
yuzefovich committed Dec 1, 2022
1 parent 21ec411 commit f58e248
Show file tree
Hide file tree
Showing 4 changed files with 98 additions and 17 deletions.
36 changes: 36 additions & 0 deletions pkg/sql/logictest/testdata/logic_test/pg_catalog
Original file line number Diff line number Diff line change
Expand Up @@ -4674,3 +4674,39 @@ order by attnum;
attnum attname
1 x
2 y

# Regression test for not projecting away looked up columns by the left semi
# virtual lookup join (#91012).
statement ok
CREATE TABLE t91012 (id INT, a_id INT);

query I
SELECT
count(*)
FROM
pg_class AS t INNER JOIN pg_attribute AS a ON t.oid = a.attrelid
WHERE
a.attnotnull = 'f'
AND a.attname = 'a_id'
AND t.relname = 't91012'
AND a.atttypid
IN (SELECT oid FROM pg_type WHERE typname = ANY (ARRAY['int8']));
----
1

# Regression test for incorrectly handling left anti virtual lookup joins
# (#88096).
statement ok
CREATE TYPE mytype AS enum('hello')

query I
SELECT
count(*)
FROM
pg_type AS t
WHERE
t.typrelid = 0
AND NOT EXISTS(SELECT 1 FROM pg_type AS el WHERE el.oid = t.typelem AND el.typarray = t.oid)
AND t.typname LIKE 'myt%'
----
1
1 change: 1 addition & 0 deletions pkg/sql/opt/xform/join_funcs.go
Original file line number Diff line number Diff line change
Expand Up @@ -292,6 +292,7 @@ func (c *CustomFuncs) GenerateLookupJoins(
//
// It should be possible to support semi- and anti- joins. Left joins may be
// possible with additional complexity.
// TODO(mgartner): update this comment.
//
// It should also be possible to support cases where all the virtual columns are
// not covered by a single index by wrapping the lookup join in a Project that
Expand Down
16 changes: 12 additions & 4 deletions pkg/sql/opt_exec_factory.go
Original file line number Diff line number Diff line change
Expand Up @@ -790,10 +790,18 @@ func (ef *execFactory) constructVirtualTableLookupJoin(
tableScan.index = idx
vtableCols := colinfo.ResultColumnsFromColumns(tableDesc.GetID(), tableDesc.PublicColumns())
projectedVtableCols := planColumns(&tableScan)
outputCols := make(colinfo.ResultColumns, 0, len(inputCols)+len(projectedVtableCols))
outputCols = append(outputCols, inputCols...)
outputCols = append(outputCols, projectedVtableCols...)
// joinType is either INNER or LEFT_OUTER.
var outputCols colinfo.ResultColumns
switch joinType {
case descpb.InnerJoin, descpb.LeftOuterJoin:
outputCols = make(colinfo.ResultColumns, 0, len(inputCols)+len(projectedVtableCols))
outputCols = append(outputCols, inputCols...)
outputCols = append(outputCols, projectedVtableCols...)
case descpb.LeftSemiJoin, descpb.LeftAntiJoin:
outputCols = make(colinfo.ResultColumns, 0, len(inputCols))
outputCols = append(outputCols, inputCols...)
default:
return nil, errors.AssertionFailedf("unexpected join type for virtual lookup join: %s", joinType.String())
}
pred := makePredicate(joinType, inputCols, projectedVtableCols)
pred.onCond = pred.iVarHelper.Rebind(onCond)
n := &vTableLookupJoinNode{
Expand Down
62 changes: 49 additions & 13 deletions pkg/sql/virtual_table.go
Original file line number Diff line number Diff line change
Expand Up @@ -235,9 +235,13 @@ type vTableLookupJoinNode struct {

// run contains the runtime state of this planNode.
run struct {
// matched indicates whether the current input row had at least one
// match.
matched bool
// row contains the next row to output.
row tree.Datums
// rows contains the next rows to output, except for row.
// rows contains the next rows to output, except for row. Only allocated
// for inner and left outer joins.
rows *rowcontainer.RowContainer
keyCtx constraint.KeyContext

Expand All @@ -257,10 +261,14 @@ var _ rowPusher = &vTableLookupJoinNode{}
// startExec implements the planNode interface.
func (v *vTableLookupJoinNode) startExec(params runParams) error {
v.run.keyCtx = constraint.KeyContext{EvalCtx: params.EvalContext()}
v.run.rows = rowcontainer.NewRowContainer(
params.p.Mon().MakeBoundAccount(),
colinfo.ColTypeInfoFromResCols(v.columns),
)
if v.joinType == descpb.InnerJoin || v.joinType == descpb.LeftOuterJoin {
v.run.rows = rowcontainer.NewRowContainer(
params.p.Mon().MakeBoundAccount(),
colinfo.ColTypeInfoFromResCols(v.columns),
)
} else if v.joinType != descpb.LeftSemiJoin && v.joinType != descpb.LeftAntiJoin {
return errors.AssertionFailedf("unexpected join type for virtual lookup join: %s", v.joinType.String())
}
v.run.indexKeyDatums = make(tree.Datums, len(v.columns))
var err error
db, err := params.p.Descriptors().GetImmutableDatabaseByName(
Expand All @@ -285,7 +293,7 @@ func (v *vTableLookupJoinNode) Next(params runParams) (bool, error) {
v.run.params = &params
for {
// Check if there are any rows left to emit from the last input row.
if v.run.rows.Len() > 0 {
if v.run.rows != nil && v.run.rows.Len() > 0 {
copy(v.run.row, v.run.rows.At(0))
v.run.rows.PopFirst(params.ctx)
return true, nil
Expand Down Expand Up @@ -315,18 +323,38 @@ func (v *vTableLookupJoinNode) Next(params runParams) (bool, error) {
)
// Add the input row to the left of the scratch row.
v.run.row = append(v.run.row[:0], inputRow...)
v.run.matched = false
// Finally, we're ready to do the lookup. This invocation will push all of
// the looked-up rows into v.run.rows.
if err := genFunc(params.ctx, v); err != nil {
return false, err
}
if v.run.rows.Len() == 0 && v.joinType == descpb.LeftOuterJoin {
// No matches - construct an outer match.
v.run.row = v.run.row[:len(v.inputCols)]
for i := len(inputRow); i < len(v.columns); i++ {
v.run.row = append(v.run.row, tree.DNull)
switch v.joinType {
case descpb.LeftOuterJoin:
if !v.run.matched {
// No matches - construct an outer match.
v.run.row = v.run.row[:len(v.inputCols)]
for i := len(inputRow); i < len(v.columns); i++ {
v.run.row = append(v.run.row, tree.DNull)
}
return true, nil
}
case descpb.LeftSemiJoin:
if v.run.matched {
// This input row had a match, so it should be emitted.
//
// Reset our output row to just the contents of the input row.
v.run.row = v.run.row[:len(v.inputCols)]
return true, nil
}
case descpb.LeftAntiJoin:
if !v.run.matched {
// This input row didn't have a match, so it should be emitted.
//
// Reset our output row to just the contents of the input row.
v.run.row = v.run.row[:len(v.inputCols)]
return true, nil
}
return true, nil
}
}
}
Expand All @@ -350,6 +378,12 @@ func (v *vTableLookupJoinNode) pushRow(lookedUpRow ...tree.Datum) error {
); !ok || err != nil {
return err
}
v.run.matched = true
if v.joinType == descpb.LeftSemiJoin || v.joinType == descpb.LeftAntiJoin {
// Avoid adding the row into the container since for left semi and left
// anti joins we only care to know whether there was a match or not.
return nil
}
_, err := v.run.rows.AddRow(v.run.params.ctx, v.run.row)
return err
}
Expand All @@ -362,5 +396,7 @@ func (v *vTableLookupJoinNode) Values() tree.Datums {
// Close implements the planNode interface.
func (v *vTableLookupJoinNode) Close(ctx context.Context) {
v.input.Close(ctx)
v.run.rows.Close(ctx)
if v.run.rows != nil {
v.run.rows.Close(ctx)
}
}

0 comments on commit f58e248

Please sign in to comment.