Skip to content

Commit

Permalink
feat: fail correlated subqueries if we are unable to merge them in a …
Browse files Browse the repository at this point in the history
…route

Signed-off-by: Manan Gupta <manan@planetscale.com>
  • Loading branch information
GuptaManan100 committed Dec 6, 2023
1 parent 3d53207 commit 228930d
Show file tree
Hide file tree
Showing 6 changed files with 32 additions and 22 deletions.
19 changes: 10 additions & 9 deletions go/vt/vtgate/planbuilder/operators/ast_to_op.go
Original file line number Diff line number Diff line change
Expand Up @@ -108,23 +108,24 @@ func findTablesContained(ctx *plancontext.PlanningContext, node sqlparser.SQLNod
return
}

func rewriteRemainingColumns(
func checkForCorrelatedSubqueries(
ctx *plancontext.PlanningContext,
stmt sqlparser.SelectStatement,
subqID semantics.TableSet,
) sqlparser.SelectStatement {
return sqlparser.CopyOnRewrite(stmt, nil, func(cursor *sqlparser.CopyOnWriteCursor) {
colname, isColname := cursor.Node().(*sqlparser.ColName)
) (correlated bool) {
_ = sqlparser.Walk(func(node sqlparser.SQLNode) (kontinue bool, err error) {
colname, isColname := node.(*sqlparser.ColName)
if !isColname {
return
return true, nil
}
deps := ctx.SemTable.RecursiveDeps(colname)
if deps.IsSolvedBy(subqID) {
return
return true, nil
}
rsv := ctx.GetReservedArgumentFor(colname)
cursor.Replace(sqlparser.NewArgument(rsv))
}, nil).(sqlparser.SelectStatement)
correlated = true
return false, nil
}, stmt)
return correlated
}

// joinPredicateCollector is used to inspect the predicates inside the subquery, looking for any
Expand Down
6 changes: 6 additions & 0 deletions go/vt/vtgate/planbuilder/operators/subquery.go
Original file line number Diff line number Diff line change
Expand Up @@ -49,6 +49,9 @@ type SubQuery struct {
// Fields related to correlated subqueries:
Vars map[string]int // Arguments copied from outer to inner, set during offset planning.
outerID semantics.TableSet
// correlated stores whether this subquery is correlated or not.
// We use this information to fail the planning if we are unable to merge the subquery with a route.
correlated bool

IsProjection bool
}
Expand Down Expand Up @@ -200,6 +203,9 @@ func (sq *SubQuery) settle(ctx *plancontext.PlanningContext, outer Operator) (Op
if !sq.TopLevel {
return nil, subqueryNotAtTopErr
}
if sq.correlated {
return nil, correlatedSubqueryErr
}
if sq.IsProjection {
if len(sq.GetMergePredicates()) > 0 {
// this means that we have a correlated subquery on our hands
Expand Down
8 changes: 3 additions & 5 deletions go/vt/vtgate/planbuilder/operators/subquery_builder.go
Original file line number Diff line number Diff line change
Expand Up @@ -169,12 +169,9 @@ func createSubquery(
sqc := &SubQueryBuilder{totalID: totalID, subqID: subqID, outerID: outerID}

predicates, joinCols := sqc.inspectStatement(ctx, subq.Select)
stmt := rewriteRemainingColumns(ctx, subq.Select, subqID)
correlated := checkForCorrelatedSubqueries(ctx, subq.Select, subqID)

// TODO: this should not be needed. We are using CopyOnRewrite above, but somehow this is not getting copied
ctx.SemTable.CopySemanticInfo(subq.Select, stmt)

opInner := translateQueryToOp(ctx, stmt)
opInner := translateQueryToOp(ctx, subq.Select)

opInner = sqc.getRootOperator(opInner, nil)
return &SubQuery{
Expand All @@ -187,6 +184,7 @@ func createSubquery(
IsProjection: isProjection,
TopLevel: topLevel,
JoinColumns: joinCols,
correlated: correlated,
}
}

Expand Down
8 changes: 4 additions & 4 deletions go/vt/vtgate/planbuilder/testdata/info_schema57_cases.json
Original file line number Diff line number Diff line change
Expand Up @@ -1037,10 +1037,10 @@
},
{
"comment": "merge even one side have schema name in subquery",
"query": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `COLUMN_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"query": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `TABLE_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"plan": {
"QueryType": "SELECT",
"Original": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `COLUMN_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"Original": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `TABLE_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"Instructions": {
"OperatorType": "UncorrelatedSubquery",
"Variant": "PulloutIn",
Expand All @@ -1066,8 +1066,8 @@
"Name": "main",
"Sharded": false
},
"FieldQuery": "select :COLUMN_NAME from information_schema.`tables` as t where 1 != 1",
"Query": "select distinct :COLUMN_NAME from information_schema.`tables` as t where t.TABLE_SCHEMA = :__vtschemaname /* VARCHAR */",
"FieldQuery": "select TABLE_NAME from information_schema.`tables` as t where 1 != 1",
"Query": "select distinct TABLE_NAME from information_schema.`tables` as t where t.TABLE_SCHEMA = :__vtschemaname /* VARCHAR */",
"SysTableTableSchema": "['a']",
"Table": "information_schema.`tables`"
},
Expand Down
8 changes: 4 additions & 4 deletions go/vt/vtgate/planbuilder/testdata/info_schema80_cases.json
Original file line number Diff line number Diff line change
Expand Up @@ -1102,10 +1102,10 @@
},
{
"comment": "merge even one side have schema name in subquery",
"query": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `COLUMN_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"query": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `TABLE_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"plan": {
"QueryType": "SELECT",
"Original": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `COLUMN_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"Original": "select `COLLATION_NAME` from information_schema.`COLUMNS` t where `COLUMN_NAME` in (select `TABLE_NAME` from information_schema.tables t where t.TABLE_SCHEMA = 'a' union select `COLUMN_NAME` from information_schema.columns)",
"Instructions": {
"OperatorType": "UncorrelatedSubquery",
"Variant": "PulloutIn",
Expand All @@ -1131,8 +1131,8 @@
"Name": "main",
"Sharded": false
},
"FieldQuery": "select :COLUMN_NAME from information_schema.`tables` as t where 1 != 1",
"Query": "select distinct :COLUMN_NAME from information_schema.`tables` as t where t.TABLE_SCHEMA = :__vtschemaname /* VARCHAR */",
"FieldQuery": "select TABLE_NAME from information_schema.`tables` as t where 1 != 1",
"Query": "select distinct TABLE_NAME from information_schema.`tables` as t where t.TABLE_SCHEMA = :__vtschemaname /* VARCHAR */",
"SysTableTableSchema": "['a']",
"Table": "information_schema.`tables`"
},
Expand Down
5 changes: 5 additions & 0 deletions go/vt/vtgate/planbuilder/testdata/unsupported_cases.json
Original file line number Diff line number Diff line change
Expand Up @@ -378,5 +378,10 @@
"comment": "Alias cannot clash with base tables",
"query": "WITH user AS (SELECT col FROM user) SELECT * FROM user",
"plan": "VT12001: unsupported: do not support CTE that use the CTE alias inside the CTE query"
},
{
"comment": "correlated subqueries in select expressions are unsupported",
"query": "SELECT (SELECT sum(user.name) FROM music LIMIT 1) FROM user",
"plan": "VT12001: unsupported: correlated subquery is only supported for EXISTS"
}
]

0 comments on commit 228930d

Please sign in to comment.