diff --git a/pkg/sql/opt/memo/testdata/stats/join b/pkg/sql/opt/memo/testdata/stats/join index 177a20c51606..9726a3e27ba3 100644 --- a/pkg/sql/opt/memo/testdata/stats/join +++ b/pkg/sql/opt/memo/testdata/stats/join @@ -1481,7 +1481,7 @@ anti-join (lookup t.public.def) └── false [type=bool, constraints=(contradiction; tight)] # Regression test for #40460. -opt +opt disable=SimplifyJoinFilters SELECT * FROM diff --git a/pkg/sql/opt/norm/rules/join.opt b/pkg/sql/opt/norm/rules/join.opt index 3b51c0756c48..56295db1cfc3 100644 --- a/pkg/sql/opt/norm/rules/join.opt +++ b/pkg/sql/opt/norm/rules/join.opt @@ -19,9 +19,10 @@ $on:[ ... $item:(FiltersItem - (And | True | False | Null | Or) + (And | True | False | Null | Or | Is) ) & ^(IsUnsimplifiableOr $item) & + ^(IsUnsimplifiableIs $item) & ^(IsContradiction $item) ... ] & diff --git a/pkg/sql/opt/norm/rules/select.opt b/pkg/sql/opt/norm/rules/select.opt index 634d83233aab..f5e68ac41c91 100644 --- a/pkg/sql/opt/norm/rules/select.opt +++ b/pkg/sql/opt/norm/rules/select.opt @@ -18,9 +18,10 @@ $filters:[ ... $item:(FiltersItem - (And | True | False | Null | Or) + (And | True | False | Null | Or | Is) ) & - ^(IsUnsimplifiableOr $item) + ^(IsUnsimplifiableOr $item) & + ^(IsUnsimplifiableIs $item) ... ] & ^(IsFilterFalse $filters) diff --git a/pkg/sql/opt/norm/select_funcs.go b/pkg/sql/opt/norm/select_funcs.go index cded16084f73..b7589214e668 100644 --- a/pkg/sql/opt/norm/select_funcs.go +++ b/pkg/sql/opt/norm/select_funcs.go @@ -319,6 +319,18 @@ func (c *CustomFuncs) IsUnsimplifiableOr(item *memo.FiltersItem) bool { return or.Left.Op() != opt.NullOp && or.Right.Op() != opt.NullOp } +// IsUnsimplifiableIs returns true if this is an IS where the right side is not +// True or False. SimplifyFilters simplifies an IS expression with True or False +// as the right input to its left input. This function serves a similar purpose +// to IsUnsimplifiableOr. +func (c *CustomFuncs) IsUnsimplifiableIs(item *memo.FiltersItem) bool { + is, ok := item.Condition.(*memo.IsExpr) + if !ok { + return false + } + return is.Right.Op() != opt.TrueOp && is.Right.Op() != opt.FalseOp +} + // addConjuncts recursively walks a scalar expression as long as it continues to // find nested And operators. It adds any conjuncts (ignoring True operators) to // the given FiltersExpr and returns true. If it finds a False or Null operator, @@ -352,6 +364,24 @@ func (c *CustomFuncs) addConjuncts( filters = append(filters, c.f.ConstructFiltersItem(t)) } + case *memo.IsExpr: + // Attempt to replace IS (True | False) with the left input. Note + // that this replacement may cause Null to be returned where the original + // expression returned False, because IS (True | False) returns False on a + // Null input. However, in this case the replacement is valid because Select + // and Join operators treat False and Null filter conditions the same way + // (no rows returned). + if t.Right.Op() == opt.TrueOp { + // IS True => + filters = append(filters, c.f.ConstructFiltersItem(t.Left)) + } else if t.Right.Op() == opt.FalseOp { + // IS False => NOT + filters = append(filters, c.f.ConstructFiltersItem(c.f.ConstructNot(t.Left))) + } else { + // No replacement possible. + filters = append(filters, c.f.ConstructFiltersItem(t)) + } + default: filters = append(filters, c.f.ConstructFiltersItem(t)) } diff --git a/pkg/sql/opt/norm/testdata/rules/join b/pkg/sql/opt/norm/testdata/rules/join index 5d85b0d55902..9d212c6a5ab0 100644 --- a/pkg/sql/opt/norm/testdata/rules/join +++ b/pkg/sql/opt/norm/testdata/rules/join @@ -25,6 +25,10 @@ exec-ddl CREATE TABLE uv (u INT PRIMARY KEY, v INT) ---- +exec-ddl +CREATE TABLE booleans(a BOOL, b BOOL, c BOOL, d BOOL, e BOOL) +---- + norm SELECT * FROM a INNER JOIN b ON a.s='foo' OR b.y<10 ---- @@ -67,20 +71,197 @@ left-join (hash) └── k:1 = x:7 [outer=(1,7), constraints=(/1: (/NULL - ]; /7: (/NULL - ]), fd=(1)==(7), (7)==(1)] # -------------------------------------------------- -# DetectJoinContradiction +# SimplifyJoinFilters # -------------------------------------------------- -norm expect=DetectJoinContradiction -SELECT * FROM a INNER JOIN b ON (k<1 AND k>2) OR (k<4 AND k>5) +norm expect=SimplifyJoinFilters +SELECT * FROM a INNER JOIN xy ON x=1 OR NULL ---- -values - ├── columns: k:1!null i:2!null f:3!null s:4!null j:5!null x:7!null y:8!null - ├── cardinality: [0 - 0] - ├── key: () - └── fd: ()-->(1-5,7,8) +inner-join (cross) + ├── columns: k:1!null i:2 f:3!null s:4 j:5 x:7!null y:8 + ├── multiplicity: left-rows(zero-or-one), right-rows(zero-or-more) + ├── key: (1) + ├── fd: ()-->(7,8), (1)-->(2-5) + ├── scan a + │ ├── columns: k:1!null i:2 f:3!null s:4 j:5 + │ ├── key: (1) + │ └── fd: (1)-->(2-5) + ├── select + │ ├── columns: x:7!null y:8 + │ ├── cardinality: [0 - 1] + │ ├── key: () + │ ├── fd: ()-->(7,8) + │ ├── scan xy + │ │ ├── columns: x:7!null y:8 + │ │ ├── key: (7) + │ │ └── fd: (7)-->(8) + │ └── filters + │ └── x:7 = 1 [outer=(7), constraints=(/7: [/1 - /1]; tight), fd=()-->(7)] + └── filters (true) -norm expect=DetectJoinContradiction -SELECT * FROM a LEFT JOIN b ON (k<1 AND k>2) OR (k<4 AND k>5) +norm expect=SimplifyJoinFilters +SELECT * FROM a INNER JOIN xy ON (k=x AND i=y) AND true AND (f=3.5 AND s='foo') +---- +inner-join (hash) + ├── columns: k:1!null i:2!null f:3!null s:4!null j:5 x:7!null y:8!null + ├── multiplicity: left-rows(zero-or-one), right-rows(zero-or-one) + ├── key: (7) + ├── fd: ()-->(3,4), (1)-->(2,5), (7)-->(8), (1)==(7), (7)==(1), (2)==(8), (8)==(2) + ├── select + │ ├── columns: k:1!null i:2 f:3!null s:4!null j:5 + │ ├── key: (1) + │ ├── fd: ()-->(3,4), (1)-->(2,5) + │ ├── scan a + │ │ ├── columns: k:1!null i:2 f:3!null s:4 j:5 + │ │ ├── key: (1) + │ │ └── fd: (1)-->(2-5) + │ └── filters + │ ├── f:3 = 3.5 [outer=(3), constraints=(/3: [/3.5 - /3.5]; tight), fd=()-->(3)] + │ └── s:4 = 'foo' [outer=(4), constraints=(/4: [/'foo' - /'foo']; tight), fd=()-->(4)] + ├── scan xy + │ ├── columns: x:7!null y:8 + │ ├── key: (7) + │ └── fd: (7)-->(8) + └── filters + ├── k:1 = x:7 [outer=(1,7), constraints=(/1: (/NULL - ]; /7: (/NULL - ]), fd=(1)==(7), (7)==(1)] + └── i:2 = y:8 [outer=(2,8), constraints=(/2: (/NULL - ]; /8: (/NULL - ]), fd=(2)==(8), (8)==(2)] + +norm expect-not=SimplifyJoinFilters +SELECT * FROM a INNER JOIN xy ON x=1 OR k=1 +---- +inner-join (cross) + ├── columns: k:1!null i:2 f:3!null s:4 j:5 x:7!null y:8 + ├── key: (1,7) + ├── fd: (1)-->(2-5), (7)-->(8) + ├── scan a + │ ├── columns: k:1!null i:2 f:3!null s:4 j:5 + │ ├── key: (1) + │ └── fd: (1)-->(2-5) + ├── scan xy + │ ├── columns: x:7!null y:8 + │ ├── key: (7) + │ └── fd: (7)-->(8) + └── filters + └── (x:7 = 1) OR (k:1 = 1) [outer=(1,7)] + +# Inner join case. Simplify IS True. +norm expect=SimplifyJoinFilters +SELECT * FROM xy INNER JOIN booleans ON (a AND x > 0) IS True +---- +inner-join (cross) + ├── columns: x:1!null y:2 a:4!null b:5 c:6 d:7 e:8 + ├── fd: ()-->(4), (1)-->(2) + ├── select + │ ├── columns: x:1!null y:2 + │ ├── key: (1) + │ ├── fd: (1)-->(2) + │ ├── scan xy + │ │ ├── columns: x:1!null y:2 + │ │ ├── key: (1) + │ │ └── fd: (1)-->(2) + │ └── filters + │ └── x:1 > 0 [outer=(1), constraints=(/1: [/1 - ]; tight)] + ├── select + │ ├── columns: a:4!null b:5 c:6 d:7 e:8 + │ ├── fd: ()-->(4) + │ ├── scan booleans + │ │ └── columns: a:4 b:5 c:6 d:7 e:8 + │ └── filters + │ └── a:4 [outer=(4), constraints=(/4: [/true - /true]; tight), fd=()-->(4)] + └── filters (true) + +# Inner join case. Simplify is False. +norm expect=SimplifyJoinFilters +SELECT * FROM xy INNER JOIN booleans ON (a AND x > 0) IS False +---- +inner-join (cross) + ├── columns: x:1!null y:2 a:4 b:5 c:6 d:7 e:8 + ├── fd: (1)-->(2) + ├── scan xy + │ ├── columns: x:1!null y:2 + │ ├── key: (1) + │ └── fd: (1)-->(2) + ├── scan booleans + │ └── columns: a:4 b:5 c:6 d:7 e:8 + └── filters + └── (NOT a:4) OR (x:1 <= 0) [outer=(1,4)] + +# Left join case. Simplify IS True. +norm expect=SimplifyJoinFilters +SELECT * FROM xy LEFT JOIN booleans ON (a AND x > 0) IS True +---- +left-join (cross) + ├── columns: x:1!null y:2 a:4 b:5 c:6 d:7 e:8 + ├── fd: (1)-->(2) + ├── scan xy + │ ├── columns: x:1!null y:2 + │ ├── key: (1) + │ └── fd: (1)-->(2) + ├── select + │ ├── columns: a:4!null b:5 c:6 d:7 e:8 + │ ├── fd: ()-->(4) + │ ├── scan booleans + │ │ └── columns: a:4 b:5 c:6 d:7 e:8 + │ └── filters + │ └── a:4 [outer=(4), constraints=(/4: [/true - /true]; tight), fd=()-->(4)] + └── filters + └── x:1 > 0 [outer=(1), constraints=(/1: [/1 - ]; tight)] + +# Full join case. Simplify IS True. +norm expect=SimplifyJoinFilters +SELECT * FROM xy FULL JOIN booleans ON (a AND x > 0) IS True +---- +full-join (cross) + ├── columns: x:1 y:2 a:4 b:5 c:6 d:7 e:8 + ├── fd: (1)-->(2) + ├── scan xy + │ ├── columns: x:1!null y:2 + │ ├── key: (1) + │ └── fd: (1)-->(2) + ├── scan booleans + │ └── columns: a:4 b:5 c:6 d:7 e:8 + └── filters + ├── a:4 [outer=(4), constraints=(/4: [/true - /true]; tight), fd=()-->(4)] + └── x:1 > 0 [outer=(1), constraints=(/1: [/1 - ]; tight)] + +# Do not simplify IS NOT (when inputs are nullable). +norm expect-not=SimplifyJoinFilters +SELECT * FROM xy INNER JOIN booleans ON (a AND x > 0) IS NOT True +---- +inner-join (cross) + ├── columns: x:1!null y:2 a:4 b:5 c:6 d:7 e:8 + ├── fd: (1)-->(2) + ├── scan xy + │ ├── columns: x:1!null y:2 + │ ├── key: (1) + │ └── fd: (1)-->(2) + ├── scan booleans + │ └── columns: a:4 b:5 c:6 d:7 e:8 + └── filters + └── (a:4 AND (x:1 > 0)) IS NOT true [outer=(1,4)] + +# Do not simplify the IS because the right argument is Null (vs True or False). +norm expect-not=SimplifyJoinFilters +SELECT * FROM xy INNER JOIN booleans ON (a AND x > 0) IS Null +---- +inner-join (cross) + ├── columns: x:1!null y:2 a:4 b:5 c:6 d:7 e:8 + ├── fd: (1)-->(2) + ├── scan xy + │ ├── columns: x:1!null y:2 + │ ├── key: (1) + │ └── fd: (1)-->(2) + ├── scan booleans + │ └── columns: a:4 b:5 c:6 d:7 e:8 + └── filters + └── (a:4 AND (x:1 > 0)) IS NULL [outer=(1,4)] + +# Regression test for #54717. SimplifyJoinFilters should not simplify +# contradictions. Doing so can split the filter expressions into two +# FiltersItems such that they are no longer considered a contradiction, and +# DetectJoinContradiction does not fire. +norm expect=DetectJoinContradiction expect-not=SimplifyJoinFilters +SELECT * FROM a LEFT JOIN b ON k<1 AND k>2 ---- left-join (cross) ├── columns: k:1!null i:2 f:3!null s:4 j:5 x:7 y:8 @@ -98,12 +279,21 @@ left-join (cross) │ └── fd: ()-->(7,8) └── filters (true) -# Regression test for #54717. SimplifyJoinFilters should not simplify -# contradictions. Doing so can split the filter expressions into two -# FiltersItems such that they are no longer considered a contradiction, and -# DetectJoinContradiction does not fire. -norm expect=DetectJoinContradiction expect-not=SimplifyJoinFilters -SELECT * FROM a LEFT JOIN b ON k<1 AND k>2 +# -------------------------------------------------- +# DetectJoinContradiction +# -------------------------------------------------- + +norm expect=DetectJoinContradiction +SELECT * FROM a INNER JOIN b ON (k<1 AND k>2) OR (k<4 AND k>5) +---- +values + ├── columns: k:1!null i:2!null f:3!null s:4!null j:5!null x:7!null y:8!null + ├── cardinality: [0 - 0] + ├── key: () + └── fd: ()-->(1-5,7,8) + +norm expect=DetectJoinContradiction +SELECT * FROM a LEFT JOIN b ON (k<1 AND k>2) OR (k<4 AND k>5) ---- left-join (cross) ├── columns: k:1!null i:2 f:3!null s:4 j:5 x:7 y:8 @@ -2596,7 +2786,7 @@ project # -------------------------------------------------- # SimplifyJoinNotNullEquality # -------------------------------------------------- -norm expect=SimplifyJoinNotNullEquality +norm expect=SimplifyJoinNotNullEquality disable=SimplifyJoinFilters SELECT * FROM a INNER JOIN b ON (a.k=b.x) IS True ---- inner-join (hash) @@ -2615,7 +2805,7 @@ inner-join (hash) └── filters └── k:1 = x:7 [outer=(1,7), constraints=(/1: (/NULL - ]; /7: (/NULL - ]), fd=(1)==(7), (7)==(1)] -norm expect=SimplifyJoinNotNullEquality +norm expect=SimplifyJoinNotNullEquality disable=SimplifyJoinFilters SELECT * FROM a INNER JOIN b ON (a.k=b.x) IS False ---- inner-join (cross) @@ -2744,7 +2934,7 @@ inner-join (hash) # Don't trigger rule when one of the variables is nullable. norm expect-not=SimplifyJoinNotNullEquality -SELECT * FROM a INNER JOIN b ON (a.k=b.y) IS True AND (a.i=b.x) IS False +SELECT * FROM a INNER JOIN b ON (a.k=b.y) IS Null AND (a.i=b.x) IS NOT False ---- inner-join (cross) ├── columns: k:1!null i:2 f:3!null s:4 j:5 x:7!null y:8 @@ -2759,8 +2949,8 @@ inner-join (cross) │ ├── key: (7) │ └── fd: (7)-->(8) └── filters - ├── (k:1 = y:8) IS true [outer=(1,8)] - └── (i:2 = x:7) IS false [outer=(2,7)] + ├── (k:1 = y:8) IS NULL [outer=(1,8)] + └── (i:2 = x:7) IS NOT false [outer=(2,7)] # -------------------------------------------------- # ExtractJoinEqualities diff --git a/pkg/sql/opt/norm/testdata/rules/select b/pkg/sql/opt/norm/testdata/rules/select index a241f4f1b97c..d21cbdbf9e23 100644 --- a/pkg/sql/opt/norm/testdata/rules/select +++ b/pkg/sql/opt/norm/testdata/rules/select @@ -26,7 +26,7 @@ CREATE TABLE e ---- # -------------------------------------------------- -# SimplifyFilters +# SimplifySelectFilters # -------------------------------------------------- norm expect=SimplifySelectFilters SELECT * FROM a WHERE Null @@ -37,49 +37,6 @@ values ├── key: () └── fd: ()-->(1-5) -norm expect=SimplifyJoinFilters -SELECT * FROM a INNER JOIN xy ON x=1 OR NULL ----- -inner-join (cross) - ├── columns: k:1!null i:2 f:3 s:4 j:5 x:7!null y:8 - ├── multiplicity: left-rows(zero-or-one), right-rows(zero-or-more) - ├── key: (1) - ├── fd: ()-->(7,8), (1)-->(2-5) - ├── scan a - │ ├── columns: k:1!null i:2 f:3 s:4 j:5 - │ ├── key: (1) - │ └── fd: (1)-->(2-5) - ├── select - │ ├── columns: x:7!null y:8 - │ ├── cardinality: [0 - 1] - │ ├── key: () - │ ├── fd: ()-->(7,8) - │ ├── scan xy - │ │ ├── columns: x:7!null y:8 - │ │ ├── key: (7) - │ │ └── fd: (7)-->(8) - │ └── filters - │ └── x:7 = 1 [outer=(7), constraints=(/7: [/1 - /1]; tight), fd=()-->(7)] - └── filters (true) - -norm expect-not=SimplifyJoinFilters -SELECT * FROM a INNER JOIN xy ON x=1 OR k=1 ----- -inner-join (cross) - ├── columns: k:1!null i:2 f:3 s:4 j:5 x:7!null y:8 - ├── key: (1,7) - ├── fd: (1)-->(2-5), (7)-->(8) - ├── scan a - │ ├── columns: k:1!null i:2 f:3 s:4 j:5 - │ ├── key: (1) - │ └── fd: (1)-->(2-5) - ├── scan xy - │ ├── columns: x:7!null y:8 - │ ├── key: (7) - │ └── fd: (7)-->(8) - └── filters - └── (x:7 = 1) OR (k:1 = 1) [outer=(1,7)] - norm expect=SimplifySelectFilters SELECT * FROM a WHERE i=1 AND Null ---- @@ -136,32 +93,85 @@ select └── filters └── (k:1 = 1) OR (i:2 = 2) [outer=(1,2)] -norm expect=SimplifyJoinFilters -SELECT * FROM a INNER JOIN xy ON (k=x AND i=y) AND true AND (f=3.5 AND s='foo') +# Simplify IS True to its left input. +norm expect=SimplifySelectFilters +SELECT * FROM c WHERE a IS True ---- -inner-join (hash) - ├── columns: k:1!null i:2!null f:3!null s:4!null j:5 x:7!null y:8!null - ├── multiplicity: left-rows(zero-or-one), right-rows(zero-or-one) - ├── key: (7) - ├── fd: ()-->(3,4), (1)-->(2,5), (7)-->(8), (1)==(7), (7)==(1), (2)==(8), (8)==(2) +select + ├── columns: a:1!null b:2 c:3 d:4 e:5 + ├── fd: ()-->(1) + ├── scan c + │ └── columns: a:1 b:2 c:3 d:4 e:5 + └── filters + └── a:1 [outer=(1), constraints=(/1: [/true - /true]; tight), fd=()-->(1)] + +# Simplify IS False to the negation of its left input. +norm expect=SimplifySelectFilters +SELECT * FROM c WHERE a IS False +---- +select + ├── columns: a:1!null b:2 c:3 d:4 e:5 + ├── fd: ()-->(1) + ├── scan c + │ └── columns: a:1 b:2 c:3 d:4 e:5 + └── filters + └── NOT a:1 [outer=(1), constraints=(/1: [/false - /false]; tight), fd=()-->(1)] + +# Simplify a deeply nested IS True. +norm expect=SimplifySelectFilters +Select * FROM c WHERE a AND (b AND (c AND (d AND (e IS True)))) +---- +select + ├── columns: a:1!null b:2!null c:3!null d:4!null e:5!null + ├── fd: ()-->(1-5) + ├── scan c + │ └── columns: a:1 b:2 c:3 d:4 e:5 + └── filters + ├── a:1 [outer=(1), constraints=(/1: [/true - /true]; tight), fd=()-->(1)] + ├── b:2 [outer=(2), constraints=(/2: [/true - /true]; tight), fd=()-->(2)] + ├── c:3 [outer=(3), constraints=(/3: [/true - /true]; tight), fd=()-->(3)] + ├── d:4 [outer=(4), constraints=(/4: [/true - /true]; tight), fd=()-->(4)] + └── e:5 [outer=(5), constraints=(/5: [/true - /true]; tight), fd=()-->(5)] + +# Don't simplify the IS because the IS expression is a projection, not a Select +# filter. +norm expect-not=SimplifySelectFilters +Select a IS True FROM c WHERE b +---- +project + ├── columns: "?column?":8!null ├── select - │ ├── columns: k:1!null i:2 f:3!null s:4!null j:5 - │ ├── key: (1) - │ ├── fd: ()-->(3,4), (1)-->(2,5) - │ ├── scan a - │ │ ├── columns: k:1!null i:2 f:3 s:4 j:5 - │ │ ├── key: (1) - │ │ └── fd: (1)-->(2-5) + │ ├── columns: a:1 b:2!null + │ ├── fd: ()-->(2) + │ ├── scan c + │ │ └── columns: a:1 b:2 │ └── filters - │ ├── f:3 = 3.5 [outer=(3), constraints=(/3: [/3.5 - /3.5]; tight), fd=()-->(3)] - │ └── s:4 = 'foo' [outer=(4), constraints=(/4: [/'foo' - /'foo']; tight), fd=()-->(4)] - ├── scan xy - │ ├── columns: x:7!null y:8 - │ ├── key: (7) - │ └── fd: (7)-->(8) + │ └── b:2 [outer=(2), constraints=(/2: [/true - /true]; tight), fd=()-->(2)] + └── projections + └── a:1 IS true [as="?column?":8, outer=(1)] + +# Don't simplify an IS NOT expression. +norm expect-not=SimplifySelectFilters +SELECT * FROM c WHERE a IS NOT True +---- +select + ├── columns: a:1 b:2 c:3 d:4 e:5 + ├── scan c + │ └── columns: a:1 b:2 c:3 d:4 e:5 └── filters - ├── k:1 = x:7 [outer=(1,7), constraints=(/1: (/NULL - ]; /7: (/NULL - ]), fd=(1)==(7), (7)==(1)] - └── i:2 = y:8 [outer=(2,8), constraints=(/2: (/NULL - ]; /8: (/NULL - ]), fd=(2)==(8), (8)==(2)] + └── a:1 IS NOT true [outer=(1), constraints=(/1: [ - /false]; tight)] + +# Don't simplify the IS because its right argument is Null. +norm expect-not=SimplifySelectFilters +SELECT * FROM c WHERE a IS Null +---- +select + ├── columns: a:1 b:2 c:3 d:4 e:5 + ├── fd: ()-->(1) + ├── scan c + │ └── columns: a:1 b:2 c:3 d:4 e:5 + └── filters + └── a:1 IS NULL [outer=(1), constraints=(/1: [/NULL - /NULL]; tight), fd=()-->(1)] # -------------------------------------------------- # ConsolidateSelectFilters