From 4391191f46dfaece8c67fa234cd83d77750235ee Mon Sep 17 00:00:00 2001 From: DrewKimball Date: Wed, 7 Sep 2022 19:02:08 -0700 Subject: [PATCH] opt: add scan constant columns to ordering if they are in the output Previously, when building the provided ordering for a constrained scan, any columns proven to be constant by the constraint were ignored. This allows the optimizer to prove that the scan can provide orderings that omit those columns. However, in the case when one of these columns is an output column and the functional dependencies do not show it as constant, an internal error will result. This happens because the provided ordering omits the constant column, but the functional dependencies cannot later be used to show that the column was optional when checking whether the required ordering is satisfied. This commit modifies the logic so that index columns constrained to a constant are omitted from the provided ordering only when they are not output columns. Fixes #83793 Release note (bug fix): fixed a bug introduced in 21.2 that could cause an internal error in rare cases when a query required a constrained index scan to return results in order. --- pkg/sql/opt/ordering/scan.go | 12 +++++-- pkg/sql/opt/xform/testdata/physprops/ordering | 32 +++++++++++++++++++ 2 files changed, 41 insertions(+), 3 deletions(-) diff --git a/pkg/sql/opt/ordering/scan.go b/pkg/sql/opt/ordering/scan.go index 417cb1b32ce5..15de46c82669 100644 --- a/pkg/sql/opt/ordering/scan.go +++ b/pkg/sql/opt/ordering/scan.go @@ -130,14 +130,20 @@ func scanBuildProvided(expr memo.RelExpr, required *props.OrderingChoice) opt.Or // We generate the longest ordering that this scan can provide, then we trim // it. This is the longest prefix of index columns that are output by the scan // (ignoring constant columns, in the case of constrained scans). - // We start the for loop at the exact prefix since all columns in the exact - // prefix are constant and can be ignored. 
+ outCols := expr.Relational().OutputCols constCols := fds.ComputeClosure(opt.ColSet{}) numCols := index.KeyColumnCount() provided := make(opt.Ordering, 0, numCols) - for i := scan.ExactPrefix; i < numCols; i++ { + for i := 0; i < numCols; i++ { indexCol := index.Column(i) colID := scan.Table.ColumnID(indexCol.Ordinal()) + if i < scan.ExactPrefix && !outCols.Contains(colID) { + // All columns in the exact prefix are constant and can be ignored as long + // as they are not in the output of the scan. If an exact-prefix column is + // in the output, it may still be constant, but can only be ignored if the + // FDs "know" it is constant. This latter case is handled below as normal. + continue + } if constCols.Contains(colID) { // Column constrained to a constant, ignore. continue diff --git a/pkg/sql/opt/xform/testdata/physprops/ordering b/pkg/sql/opt/xform/testdata/physprops/ordering index 7b5497e45911..c722e762bb0e 100644 --- a/pkg/sql/opt/xform/testdata/physprops/ordering +++ b/pkg/sql/opt/xform/testdata/physprops/ordering @@ -2709,3 +2709,35 @@ sort ├── cardinality: [0 - 0] ├── key: () └── fd: ()-->(6,12,23) + +# Regression test for #83793 - include scan columns that are constrained to be +# constant in the provided ordering when they are in the output of the scan. +exec-ddl +CREATE TABLE t83793 ( + a INT, + b STRING AS (a::STRING) STORED, + c STRING AS (a::STRING) VIRTUAL, + UNIQUE (b, a) +); +---- + +opt format=hide-all +SELECT NULL FROM t83793 +WHERE NOT (c NOT SIMILAR TO '') +GROUP BY b HAVING bool_and(NULL); +---- +project + ├── select + │ ├── group-by (streaming) + │ │ ├── project + │ │ │ ├── scan t83793@t83793_b_a_key + │ │ │ │ └── constraint: /2/1: [/'' - /''] + │ │ │ └── projections + │ │ │ └── NULL + │ │ └── aggregations + │ │ └── bool-and + │ │ └── column7 + │ └── filters + │ └── bool_and + └── projections + └── NULL