From b3744c8eb1e9c870574bc4866eac0041a56263ce Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 10:19:25 +0200 Subject: [PATCH 01/10] Proper clone of joinTree's vars map Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/jointree.go | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/go/vt/vtgate/planbuilder/jointree.go b/go/vt/vtgate/planbuilder/jointree.go index 4f9c2175852..f15e20e12a3 100644 --- a/go/vt/vtgate/planbuilder/jointree.go +++ b/go/vt/vtgate/planbuilder/jointree.go @@ -45,7 +45,10 @@ func (jp *joinTree) clone() queryTree { lhs: jp.lhs.clone(), rhs: jp.rhs.clone(), outer: jp.outer, - vars: jp.vars, + vars: make(map[string]int, len(jp.vars)), + } + for key, val := range jp.vars { + result.vars[key] = val } return result } From 10e4478326f0e703cf12d80590d7ce448cfe9618 Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 11:21:14 +0200 Subject: [PATCH 02/10] Pushing join output columns on top of already existing output cols Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/jointree.go | 12 +++++++----- 1 file changed, 7 insertions(+), 5 deletions(-) diff --git a/go/vt/vtgate/planbuilder/jointree.go b/go/vt/vtgate/planbuilder/jointree.go index f15e20e12a3..c1753cc70e1 100644 --- a/go/vt/vtgate/planbuilder/jointree.go +++ b/go/vt/vtgate/planbuilder/jointree.go @@ -42,10 +42,11 @@ func (jp *joinTree) tableID() semantics.TableSet { func (jp *joinTree) clone() queryTree { result := &joinTree{ - lhs: jp.lhs.clone(), - rhs: jp.rhs.clone(), - outer: jp.outer, - vars: make(map[string]int, len(jp.vars)), + lhs: jp.lhs.clone(), + rhs: jp.rhs.clone(), + outer: jp.outer, + columns: jp.columns, + vars: make(map[string]int, len(jp.vars)), } for key, val := range jp.vars { result.vars[key] = val @@ -81,8 +82,9 @@ func (jp *joinTree) pushOutputColumns(columns []*sqlparser.ColName, semTable *se outputColumns := make([]int, len(toTheLeft)) var l, r int + originalColSize := len(jp.vars) for i, isLeft := range toTheLeft { - outputColumns[i] = i + outputColumns[i] = i + originalColSize if isLeft { jp.columns = append(jp.columns, -lhsOffset[l]-1) l++ From d1bff26b29f9f51aec2ffd11f2b61bbf5c190e7d Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 13:04:02 +0200 Subject: [PATCH 03/10] Pushing comparison containing argument on join in a different way to ensure dependencies Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/route_planning.go | 196 +++++++++++++++------ 1 file changed, 138 insertions(+), 58 deletions(-) diff --git a/go/vt/vtgate/planbuilder/route_planning.go b/go/vt/vtgate/planbuilder/route_planning.go index 2623ecdf2f6..102457ce8d4 100644 --- a/go/vt/vtgate/planbuilder/route_planning.go +++ b/go/vt/vtgate/planbuilder/route_planning.go @@ -405,82 +405,162 @@ func stripDownQuery(from, to sqlparser.SelectStatement) error { } func pushJoinPredicate(ctx planningContext, exprs []sqlparser.Expr, tree queryTree) (queryTree, error) { + if len(exprs) == 0 { + return tree, nil + } switch node := tree.(type) { case *routeTree: - plan := node.clone().(*routeTree) - err := plan.addPredicate(ctx, exprs...) + return pushJoinPredicateOnRoute(ctx, exprs, node) + case *joinTree: + return pushJoinPredicateOnJoin(ctx, exprs, node) + case *derivedTree: + return pushJoinPredicateOnDerived(ctx, exprs, node) + case *vindexTree: + // vindexFunc cannot accept predicates from the other side of a join + return node, nil + default: + panic(fmt.Sprintf("BUG: unknown type %T", node)) + } +} + +func pushJoinPredicateOnRoute(ctx planningContext, exprs []sqlparser.Expr, node *routeTree) (queryTree, error) { + plan := node.clone().(*routeTree) + err := plan.addPredicate(ctx, exprs...) + if err != nil { + return nil, err + } + return plan, nil +} + +func pushJoinPredicateOnDerived(ctx planningContext, exprs []sqlparser.Expr, node *derivedTree) (queryTree, error) { + plan := node.clone().(*derivedTree) + + newExpressions := make([]sqlparser.Expr, 0, len(exprs)) + for _, expr := range exprs { + tblInfo, err := ctx.semTable.TableInfoForExpr(expr) if err != nil { return nil, err } - return plan, nil - - case *joinTree: - node = node.clone().(*joinTree) - - // we break up the predicates so that colnames from the LHS are replaced by arguments - var rhsPreds []sqlparser.Expr - var lhsColumns []*sqlparser.ColName - var lhsVarsName []string - lhsSolves := node.lhs.tableID() - for _, expr := range exprs { - bvName, cols, predicate, err := breakPredicateInLHSandRHS(expr, ctx.semTable, lhsSolves) - if err != nil { - return nil, err - } - lhsColumns = append(lhsColumns, cols...) - lhsVarsName = append(lhsVarsName, bvName...) - rhsPreds = append(rhsPreds, predicate) - } - if lhsColumns != nil && lhsVarsName != nil { - idxs, err := node.pushOutputColumns(lhsColumns, ctx.semTable) - if err != nil { - return nil, err - } - for i, idx := range idxs { - node.vars[lhsVarsName[i]] = idx - } + rewritten, err := semantics.RewriteDerivedExpression(expr, tblInfo) + if err != nil { + return nil, err } + newExpressions = append(newExpressions, rewritten) + } - rhsPlan, err := pushJoinPredicate(ctx, rhsPreds, node.rhs) + newInner, err := pushJoinPredicate(ctx, newExpressions, plan.inner) + if err != nil { + return nil, err + } + + plan.inner = newInner + return plan, nil +} + +func pushJoinPredicateOnJoin(ctx planningContext, exprs []sqlparser.Expr, node *joinTree) (queryTree, error) { + node = node.clone().(*joinTree) + + var rhsPreds []sqlparser.Expr + var lhsColumns []*sqlparser.ColName + var lhsVarsName []string + + for _, expr := range exprs { + // we are pushing argument expression in a different way, if one side + // of the comparison is an argument (*sqlparser.Argument) coming from + // then we can push the expression to either left or right hand side + // (depending on who solves the expression). such expression do not + // need to be "outputed" and sent to the RHS of the join as we would + // usually do. + newNode, err := pushArgumentsOnJoin(ctx, expr, node) if err != nil { return nil, err } + if newNode != nil { + // we are getting a new node from pushArgumentsOnJoin, meaning + // we do not need to break the predicate between LHS and RHS, thus we + // continue onto the following expression. + node = newNode + continue + } - return &joinTree{ - lhs: node.lhs, - rhs: rhsPlan, - outer: node.outer, - vars: node.vars, - }, nil - case *derivedTree: - plan := node.clone().(*derivedTree) - - newExpressions := make([]sqlparser.Expr, 0, len(exprs)) - for _, expr := range exprs { - tblInfo, err := ctx.semTable.TableInfoForExpr(expr) - if err != nil { - return nil, err - } - rewritten, err := semantics.RewriteDerivedExpression(expr, tblInfo) - if err != nil { - return nil, err - } - newExpressions = append(newExpressions, rewritten) + bvName, cols, predicate, err := breakPredicateInLHSandRHS(expr, ctx.semTable, node.lhs.tableID()) + if err != nil { + return nil, err } + lhsColumns = append(lhsColumns, cols...) + lhsVarsName = append(lhsVarsName, bvName...) + rhsPreds = append(rhsPreds, predicate) + } - newInner, err := pushJoinPredicate(ctx, newExpressions, plan.inner) + if lhsColumns != nil && lhsVarsName != nil { + idxs, err := node.pushOutputColumns(lhsColumns, ctx.semTable) if err != nil { return nil, err } + for i, idx := range idxs { + node.vars[lhsVarsName[i]] = idx + } + } - plan.inner = newInner - return plan, nil - case *vindexTree: - // vindexFunc cannot accept predicates from the other side of a join - return node, nil - default: - panic(fmt.Sprintf("BUG: unknown type %T", node)) + rhsPlan, err := pushJoinPredicate(ctx, rhsPreds, node.rhs) + if err != nil { + return nil, err } + return &joinTree{ + lhs: node.lhs, + rhs: rhsPlan, + outer: node.outer, + vars: node.vars, + }, nil +} + +func pushArgumentsOnJoin(ctx planningContext, expr sqlparser.Expr, node *joinTree) (*joinTree, error) { + cmp, isCmp := expr.(*sqlparser.ComparisonExpr) + if !isCmp { + return nil, nil + } + + solvedByLeft, solvedByRight := isComparisonExprSolvedByJoinTree(ctx, cmp, node) + if !solvedByLeft && !solvedByRight { + return nil, nil + } + + var nodeToReplace queryTree + if solvedByLeft { + nodeToReplace = node.lhs + } else if solvedByRight { + nodeToReplace = node.rhs + } + + newNode, err := pushJoinPredicate(ctx, []sqlparser.Expr{expr}, nodeToReplace) + if err != nil { + return nil, err + } + + if solvedByLeft { + node.lhs = newNode + } else if solvedByRight { + node.rhs = newNode + } + return node, nil +} + +func isComparisonExprSolvedByJoinTree(ctx planningContext, cmp *sqlparser.ComparisonExpr, node *joinTree) (bool, bool) { + var argExpr sqlparser.Expr + _, isLeftArg := cmp.Left.(sqlparser.Argument) + _, isRightArg := cmp.Right.(sqlparser.Argument) + if isLeftArg { + argExpr = cmp.Right + } else if isRightArg { + argExpr = cmp.Left + } else { + return false, false + } + + argDeps := ctx.semTable.RecursiveDeps(argExpr) + solvedByLeft := argDeps.IsSolvedBy(node.lhs.tableID()) + solvedByRight := argDeps.IsSolvedBy(node.rhs.tableID()) + return solvedByLeft, solvedByRight } func breakPredicateInLHSandRHS( From 15ec369ca38cd20a33b36477ec95a21c6e7ad681 Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 13:05:00 +0200 Subject: [PATCH 04/10] creation of a ruby on rails plan test that tests Rails queries Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/plan_test.go | 17 + .../planbuilder/testdata/rails_cases.txt | 206 +++++++++++ .../testdata/rails_schema_test.json | 321 ++++++++++++++++++ 3 files changed, 544 insertions(+) create mode 100644 go/vt/vtgate/planbuilder/testdata/rails_cases.txt create mode 100644 go/vt/vtgate/planbuilder/testdata/rails_schema_test.json diff --git a/go/vt/vtgate/planbuilder/plan_test.go b/go/vt/vtgate/planbuilder/plan_test.go index ffc014d2648..583a105f6c9 100644 --- a/go/vt/vtgate/planbuilder/plan_test.go +++ b/go/vt/vtgate/planbuilder/plan_test.go @@ -218,6 +218,23 @@ func TestOne(t *testing.T) { testFile(t, "onecase.txt", "", vschema, true) } +func TestRubyOnRailsQueries(t *testing.T) { + vschemaWrapper := &vschemaWrapper{ + v: loadSchema(t, "rails_schema_test.json"), + sysVarEnabled: true, + } + + testOutputTempDir, err := ioutil.TempDir("", "plan_test") + require.NoError(t, err) + defer func() { + if !t.Failed() { + os.RemoveAll(testOutputTempDir) + } + }() + + testFile(t, "rails_cases.txt", testOutputTempDir, vschemaWrapper, true) +} + func TestOLTP(t *testing.T) { vschemaWrapper := &vschemaWrapper{ v: loadSchema(t, "oltp_schema_test.json"), diff --git a/go/vt/vtgate/planbuilder/testdata/rails_cases.txt b/go/vt/vtgate/planbuilder/testdata/rails_cases.txt new file mode 100644 index 00000000000..4dfbf463125 --- /dev/null +++ b/go/vt/vtgate/planbuilder/testdata/rails_cases.txt @@ -0,0 +1,206 @@ +# Author5.joins(books: [{orders: :customer}, :supplier]) +"select author5s.* from author5s join book6s on book6s.author5_id = author5s.id join book6s_order2s on book6s_order2s.book6_id = book6s.id join order2s on order2s.id = book6s_order2s.order2_id join customer2s on customer2s.id = order2s.customer2_id join supplier5s on supplier5s.id = book6s.supplier5_id" +{ + "QueryType": "SELECT", + "Original": "select author5s.* from author5s join book6s on book6s.author5_id = author5s.id join book6s_order2s on book6s_order2s.book6_id = book6s.id join order2s on order2s.id = book6s_order2s.order2_id join customer2s on customer2s.id = order2s.customer2_id join supplier5s on supplier5s.id = book6s.supplier5_id", + "Instructions": { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-1,-2,-3,-4", + "JoinVars": { + "book6s_supplier5_id": 4 + }, + "TableName": "author5s, book6s_book6s_order2s_order2s_customer2s_supplier5s", + "Inputs": [ + { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-1,-2,-3,-4,-5", + "JoinVars": { + "order2s_customer2_id": 5 + }, + "TableName": "author5s, book6s_book6s_order2s_order2s_customer2s", + "Inputs": [ + { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-1,-2,-3,-4,-5,1", + "JoinVars": { + "book6s_order2s_order2_id": 5 + }, + "TableName": "author5s, book6s_book6s_order2s_order2s", + "Inputs": [ + { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-1,-2,-3,-4,-5,1", + "JoinVars": { + "book6s_id": 5 + }, + "TableName": "author5s, book6s_book6s_order2s", + "Inputs": [ + { + "OperatorType": "Route", + "Variant": "SelectScatter", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select author5s.id, author5s.`name`, author5s.created_at, author5s.updated_at, book6s.supplier5_id, book6s.id from author5s join book6s on book6s.author5_id = author5s.id where 1 != 1", + "Query": "select author5s.id, author5s.`name`, author5s.created_at, author5s.updated_at, book6s.supplier5_id, book6s.id from author5s join book6s on book6s.author5_id = author5s.id", + "Table": "author5s, book6s" + }, + { + "OperatorType": "Route", + "Variant": "SelectEqualUnique", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select book6s_order2s.order2_id from book6s_order2s where 1 != 1", + "Query": "select book6s_order2s.order2_id from book6s_order2s where book6s_order2s.book6_id = :book6s_id", + "Table": "book6s_order2s", + "Values": [ + ":book6s_id" + ], + "Vindex": "binary_md5" + } + ] + }, + { + "OperatorType": "Route", + "Variant": "SelectScatter", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select order2s.customer2_id from order2s where 1 != 1", + "Query": "select order2s.customer2_id from order2s where order2s.id = :book6s_order2s_order2_id", + "Table": "order2s" + } + ] + }, + { + "OperatorType": "Route", + "Variant": "SelectEqualUnique", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select 1 from customer2s where 1 != 1", + "Query": "select 1 from customer2s where customer2s.id = :order2s_customer2_id", + "Table": "customer2s", + "Values": [ + ":order2s_customer2_id" + ], + "Vindex": "binary_md5" + } + ] + }, + { + "OperatorType": "Route", + "Variant": "SelectEqualUnique", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select 1 from supplier5s where 1 != 1", + "Query": "select 1 from supplier5s where supplier5s.id = :book6s_supplier5_id", + "Table": "supplier5s", + "Values": [ + ":book6s_supplier5_id" + ], + "Vindex": "binary_md5" + } + ] + } +} +{ + "QueryType": "SELECT", + "Original": "select author5s.* from author5s join book6s on book6s.author5_id = author5s.id join book6s_order2s on book6s_order2s.book6_id = book6s.id join order2s on order2s.id = book6s_order2s.order2_id join customer2s on customer2s.id = order2s.customer2_id join supplier5s on supplier5s.id = book6s.supplier5_id", + "Instructions": { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "1,2,3,4", + "JoinVars": { + "order2s_id": 0 + }, + "TableName": "customer2s, order2s_author5s, book6s_book6s_order2s_supplier5s", + "Inputs": [ + { + "OperatorType": "Route", + "Variant": "SelectScatter", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select order2s.id from order2s, customer2s where 1 != 1", + "Query": "select order2s.id from order2s, customer2s where customer2s.id = order2s.customer2_id", + "Table": "customer2s, order2s" + }, + { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-1,-2,-3,-4", + "JoinVars": { + "book6s_supplier5_id": 0 + }, + "TableName": "author5s, book6s_book6s_order2s_supplier5s", + "Inputs": [ + { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-3,-4,-5,-6", + "JoinVars": { + "book6s_id": 0 + }, + "TableName": "author5s, book6s_book6s_order2s", + "Inputs": [ + { + "OperatorType": "Route", + "Variant": "SelectScatter", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select book6s.id, book6s.supplier5_id, author5s.id as id, author5s.`name` as `name`, author5s.created_at as created_at, author5s.updated_at as updated_at from author5s, book6s where 1 != 1", + "Query": "select book6s.id, book6s.supplier5_id, author5s.id as id, author5s.`name` as `name`, author5s.created_at as created_at, author5s.updated_at as updated_at from author5s, book6s where book6s.author5_id = author5s.id", + "Table": "author5s, book6s" + }, + { + "OperatorType": "Route", + "Variant": "SelectEqualUnique", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select 1 from book6s_order2s where 1 != 1", + "Query": "select 1 from book6s_order2s where book6s_order2s.book6_id = :book6s_id and book6s_order2s.order2_id = :order2s_id", + "Table": "book6s_order2s", + "Values": [ + ":book6s_id" + ], + "Vindex": "binary_md5" + } + ] + }, + { + "OperatorType": "Route", + "Variant": "SelectEqualUnique", + "Keyspace": { + "Name": "user", + "Sharded": true + }, + "FieldQuery": "select 1 from supplier5s where 1 != 1", + "Query": "select 1 from supplier5s where supplier5s.id = :book6s_supplier5_id", + "Table": "supplier5s", + "Values": [ + ":book6s_supplier5_id" + ], + "Vindex": "binary_md5" + } + ] + } + ] + } +} diff --git a/go/vt/vtgate/planbuilder/testdata/rails_schema_test.json b/go/vt/vtgate/planbuilder/testdata/rails_schema_test.json new file mode 100644 index 00000000000..26e0ec1dec7 --- /dev/null +++ b/go/vt/vtgate/planbuilder/testdata/rails_schema_test.json @@ -0,0 +1,321 @@ +{ + "keyspaces": { + "user": { + "sharded": true, + "vindexes": { + "binary_md5": { + "type": "hash_test" + } + }, + "tables": { + "order2s": { + "column_vindexes": [ + { + "columns": [ + "customer2_id" + ], + "name": "binary_md5" + } + ], + "auto_increment": { + "column": "id", + "sequence": "order2s_seq" + }, + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "customer2_id", + "type": "INT64" + }, + { + "name": "status", + "type": "INT32" + }, + { + "name": "created_at", + "type": "DATETIME" + }, + { + "name": "updated_at", + "type": "DATETIME" + } + ], + "column_list_authoritative": true + }, + "book6s": { + "column_vindexes": [ + { + "columns": [ + "author5_id" + ], + "name": "binary_md5" + } + ], + "auto_increment": { + "column": "id", + "sequence": "book6s_seq" + }, + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "author5_id", + "type": "INT64" + }, + { + "name": "supplier5_id", + "type": "INT64" + }, + { + "name": "title", + "type": "VARCHAR" + }, + { + "name": "price", + "type": "INT32" + }, + { + "name": "year_published", + "type": "INT32" + }, + { + "name": "out_of_print", + "type": "INT8" + }, + { + "name": "created_at", + "type": "DATETIME" + }, + { + "name": "updated_at", + "type": "DATETIME" + } + ], + "column_list_authoritative": true + }, + "book6s_order2s": { + "column_vindexes": [ + { + "columns": [ + "book6_id" + ], + "name": "binary_md5" + } + ], + "columns": [ + { + "name": "book6_id", + "type": "INT64" + }, + { + "name": "order2_id", + "type": "INT64" + } + ], + "column_list_authoritative": true + }, + "customer2s": { + "column_vindexes": [ + { + "columns": [ + "id" + ], + "name": "binary_md5" + } + ], + "auto_increment": { + "column": "id", + "sequence": "customer2s_seq" + }, + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "first_name", + "type": "VARCHAR" + }, + { + "name": "orders_count", + "type": "INT32" + }, + { + "name": "lock_version", + "type": "INT32" + }, + { + "name": "created_at", + "type": "DATETIME" + }, + { + "name": "updated_at", + "type": "DATETIME" + } + ], + "column_list_authoritative": true + }, + "author5s": { + "column_vindexes": [ + { + "columns": [ + "id" + ], + "name": "binary_md5" + } + ], + "auto_increment": { + "column": "id", + "sequence": "author5s_seq" + }, + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "name", + "type": "VARCHAR" + }, + { + "name": "created_at", + "type": "DATETIME" + }, + { + "name": "updated_at", + "type": "DATETIME" + } + ], + "column_list_authoritative": true + }, + "supplier5s": { + "column_vindexes": [ + { + "columns": [ + "id" + ], + "name": "binary_md5" + } + ], + "auto_increment": { + "column": "id", + "sequence": "supplier5s_seq" + }, + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "state", + "type": "VARCHAR" + }, + { + "name": "created_at", + "type": "DATETIME" + }, + { + "name": "updated_at", + "type": "DATETIME" + } + ], + "column_list_authoritative": true + } + } + }, + "main": { + "tables": { + "book6s_seq": { + "type": "sequence", + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "next_id", + "type": "INT64" + }, + { + "name": "cache", + "type": "INT64" + } + ], + "column_list_authoritative": true + }, + "author5s_seq": { + "type": "sequence", + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "next_id", + "type": "INT64" + }, + { + "name": "cache", + "type": "INT64" + } + ], + "column_list_authoritative": true + }, + "supplier5s_seq": { + "type": "sequence", + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "next_id", + "type": "INT64" + }, + { + "name": "cache", + "type": "INT64" + } + ], + "column_list_authoritative": true + }, + "customer2s_seq": { + "type": "sequence", + "columns": [ + { + "name": "id", + "type": "INT64" + }, + { + "name": "next_id", + "type": "INT64" + }, + { + "name": "cache", + "type": "INT64" + } + ], + "column_list_authoritative": true + }, + "order2s_seq": { + "type": "sequence", + "columns": [ + { + "name": "predef1" + }, + { + "name": "cache", + "type": "INT64" + } + ], + "column_list_authoritative": true + } + } + } + } +} From 6260918c0c0245d8f7f8be3178d5184cd9763334 Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 13:05:41 +0200 Subject: [PATCH 05/10] Updated plan tests expected output for Gen4 Signed-off-by: Florent Poinsard --- .../planbuilder/testdata/from_cases.txt | 19 ++- .../planbuilder/testdata/tpch_cases.txt | 155 +++++++++--------- .../planbuilder/testdata/wireup_cases.txt | 9 +- 3 files changed, 92 insertions(+), 91 deletions(-) diff --git a/go/vt/vtgate/planbuilder/testdata/from_cases.txt b/go/vt/vtgate/planbuilder/testdata/from_cases.txt index 9ee168b908b..6be80853958 100644 --- a/go/vt/vtgate/planbuilder/testdata/from_cases.txt +++ b/go/vt/vtgate/planbuilder/testdata/from_cases.txt @@ -642,7 +642,7 @@ Gen4 plan same as above "Sharded": true }, "FieldQuery": "select e.col from user_extra as e where 1 != 1", - "Query": "select e.col from user_extra as e", + "Query": "select e.col from user_extra as e where e.col = :user_col", "Table": "user_extra" }, { @@ -653,7 +653,7 @@ Gen4 plan same as above "Sharded": false }, "FieldQuery": "select 1 from unsharded as m1 where 1 != 1", - "Query": "select 1 from unsharded as m1 where m1.col = :e_col and :user_col = :e_col", + "Query": "select 1 from unsharded as m1 where m1.col = :e_col", "Table": "unsharded" } ] @@ -2605,21 +2605,22 @@ Gen4 plan same as above "OperatorType": "Join", "Variant": "Join", "JoinColumnIndexes": "-1,-2", - "JoinVars": { - "user_id": 0 - }, "TableName": "`user`_user_extra", "Inputs": [ { "OperatorType": "Route", - "Variant": "SelectScatter", + "Variant": "SelectEqualUnique", "Keyspace": { "Name": "user", "Sharded": true }, "FieldQuery": "select `user`.id, `user`.col1 from `user` where 1 != 1", - "Query": "select `user`.id, `user`.col1 from `user`", - "Table": "`user`" + "Query": "select `user`.id, `user`.col1 from `user` where `user`.id = :ua_id", + "Table": "`user`", + "Values": [ + ":ua_id" + ], + "Vindex": "user_index" }, { "OperatorType": "Route", @@ -2629,7 +2630,7 @@ Gen4 plan same as above "Sharded": true }, "FieldQuery": "select 1 from user_extra where 1 != 1", - "Query": "select 1 from user_extra where :user_id = :ua_id", + "Query": "select 1 from user_extra", "Table": "user_extra" } ] diff --git a/go/vt/vtgate/planbuilder/testdata/tpch_cases.txt b/go/vt/vtgate/planbuilder/testdata/tpch_cases.txt index 2c7629cc2ae..4346419f04d 100644 --- a/go/vt/vtgate/planbuilder/testdata/tpch_cases.txt +++ b/go/vt/vtgate/planbuilder/testdata/tpch_cases.txt @@ -38,32 +38,46 @@ Gen4 error: unsupported: cross-shard correlated subquery { "OperatorType": "Join", "Variant": "Join", - "JoinColumnIndexes": "1,2,-2,-3,3,-4,-5", + "JoinColumnIndexes": "-1,-2,1,2,-3,3,4", "JoinVars": { - "o_orderkey": 0 + "l_orderkey": 0 }, - "TableName": "orders_customer_lineitem", + "TableName": "lineitem_orders_customer", "Inputs": [ + { + "OperatorType": "Route", + "Variant": "SelectScatter", + "Keyspace": { + "Name": "main", + "Sharded": true + }, + "FieldQuery": "select l_orderkey, sum(l_extendedprice * (1 - l_discount)) as revenue, weight_string(l_orderkey) from lineitem where 1 != 1", + "Query": "select l_orderkey, sum(l_extendedprice * (1 - l_discount)) as revenue, weight_string(l_orderkey) from lineitem where l_shipdate \u003e date('1995-03-15')", + "Table": "lineitem" + }, { "OperatorType": "Join", "Variant": "Join", - "JoinColumnIndexes": "-2,-3,-4,-5,-6", + "JoinColumnIndexes": "-2,-3,-4,-5", "JoinVars": { - "o_custkey": 0, - "o_orderkey": 0 + "o_custkey": 0 }, "TableName": "orders_customer", "Inputs": [ { "OperatorType": "Route", - "Variant": "SelectScatter", + "Variant": "SelectEqualUnique", "Keyspace": { "Name": "main", "Sharded": true }, - "FieldQuery": "select o_custkey, o_orderkey, o_orderdate, o_shippriority, weight_string(o_orderdate), weight_string(o_shippriority) from orders where 1 != 1", - "Query": "select o_custkey, o_orderkey, o_orderdate, o_shippriority, weight_string(o_orderdate), weight_string(o_shippriority) from orders where o_orderdate \u003c date('1995-03-15')", - "Table": "orders" + "FieldQuery": "select o_custkey, o_orderdate, o_shippriority, weight_string(o_orderdate), weight_string(o_shippriority) from orders where 1 != 1", + "Query": "select o_custkey, o_orderdate, o_shippriority, weight_string(o_orderdate), weight_string(o_shippriority) from orders where o_orderdate \u003c date('1995-03-15') and o_orderkey = :l_orderkey", + "Table": "orders", + "Values": [ + ":l_orderkey" + ], + "Vindex": "hash" }, { "OperatorType": "Route", @@ -81,21 +95,6 @@ Gen4 error: unsupported: cross-shard correlated subquery "Vindex": "hash" } ] - }, - { - "OperatorType": "Route", - "Variant": "SelectEqualUnique", - "Keyspace": { - "Name": "main", - "Sharded": true - }, - "FieldQuery": "select l_orderkey, sum(l_extendedprice * (1 - l_discount)) as revenue, weight_string(l_orderkey) from lineitem where 1 != 1", - "Query": "select l_orderkey, sum(l_extendedprice * (1 - l_discount)) as revenue, weight_string(l_orderkey) from lineitem where l_shipdate \u003e date('1995-03-15') and l_orderkey = :o_orderkey", - "Table": "lineitem", - "Values": [ - ":o_orderkey" - ], - "Vindex": "lineitem_map" } ] } @@ -202,39 +201,79 @@ Gen4 plan same as above "GroupBy": "(0|8), (1|9), (3|10), (6|11), (4|12), (5|13), (7|14)", "Inputs": [ { - "OperatorType": "Join", - "Variant": "Join", - "JoinColumnIndexes": "-1,-2,1,-3,-4,-5,-6,-7,-8,-9,-10,-11,-12,-13,-14", - "JoinVars": { - "c_custkey": 0 - }, - "TableName": "customer_nation_orders_lineitem", + "OperatorType": "Sort", + "Variant": "Memory", + "OrderBy": "(0|8) ASC, (1|9) ASC, (3|10) ASC, (6|11) ASC, (4|12) ASC, (5|13) ASC, (7|14) ASC", "Inputs": [ { - "OperatorType": "Sort", - "Variant": "Memory", - "OrderBy": "(0|7) ASC, (1|8) ASC, (2|9) ASC, (5|10) ASC, (3|11) ASC, (4|12) ASC, (6|13) ASC", + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "1,2,-2,3,4,5,6,7,8,9,10,11,12,13,14", + "JoinVars": { + "o_custkey": 0 + }, + "TableName": "orders_lineitem_customer_nation", "Inputs": [ + { + "OperatorType": "Join", + "Variant": "Join", + "JoinColumnIndexes": "-2,1", + "JoinVars": { + "o_orderkey": 0 + }, + "TableName": "orders_lineitem", + "Inputs": [ + { + "OperatorType": "Route", + "Variant": "SelectScatter", + "Keyspace": { + "Name": "main", + "Sharded": true + }, + "FieldQuery": "select o_orderkey, o_custkey from orders where 1 != 1", + "Query": "select o_orderkey, o_custkey from orders where o_orderdate \u003e= date('1993-10-01') and o_orderdate \u003c date('1993-10-01') + interval '3' month", + "Table": "orders" + }, + { + "OperatorType": "Route", + "Variant": "SelectEqualUnique", + "Keyspace": { + "Name": "main", + "Sharded": true + }, + "FieldQuery": "select sum(l_extendedprice * (1 - l_discount)) as revenue from lineitem where 1 != 1", + "Query": "select sum(l_extendedprice * (1 - l_discount)) as revenue from lineitem where l_returnflag = 'R' and l_orderkey = :o_orderkey", + "Table": "lineitem", + "Values": [ + ":o_orderkey" + ], + "Vindex": "lineitem_map" + } + ] + }, { "OperatorType": "Join", "Variant": "Join", "JoinColumnIndexes": "-2,-3,-4,1,-5,-6,-7,-8,-9,-10,-11,2,-12,-13", "JoinVars": { - "c_custkey": 0, "c_nationkey": 0 }, "TableName": "customer_nation", "Inputs": [ { "OperatorType": "Route", - "Variant": "SelectScatter", + "Variant": "SelectEqualUnique", "Keyspace": { "Name": "main", "Sharded": true }, "FieldQuery": "select c_nationkey, c_custkey, c_name, c_acctbal, c_address, c_phone, c_comment, weight_string(c_custkey), weight_string(c_name), weight_string(c_acctbal), weight_string(c_phone), weight_string(c_address), weight_string(c_comment) from customer where 1 != 1", - "Query": "select c_nationkey, c_custkey, c_name, c_acctbal, c_address, c_phone, c_comment, weight_string(c_custkey), weight_string(c_name), weight_string(c_acctbal), weight_string(c_phone), weight_string(c_address), weight_string(c_comment) from customer", - "Table": "customer" + "Query": "select c_nationkey, c_custkey, c_name, c_acctbal, c_address, c_phone, c_comment, weight_string(c_custkey), weight_string(c_name), weight_string(c_acctbal), weight_string(c_phone), weight_string(c_address), weight_string(c_comment) from customer where c_custkey = :o_custkey", + "Table": "customer", + "Values": [ + ":o_custkey" + ], + "Vindex": "hash" }, { "OperatorType": "Route", @@ -254,44 +293,6 @@ Gen4 plan same as above ] } ] - }, - { - "OperatorType": "Join", - "Variant": "Join", - "JoinColumnIndexes": "1", - "JoinVars": { - "o_custkey": 0, - "o_orderkey": 0 - }, - "TableName": "orders_lineitem", - "Inputs": [ - { - "OperatorType": "Route", - "Variant": "SelectScatter", - "Keyspace": { - "Name": "main", - "Sharded": true - }, - "FieldQuery": "select o_orderkey, o_custkey from orders where 1 != 1", - "Query": "select o_orderkey, o_custkey from orders where o_orderdate \u003e= date('1993-10-01') and o_orderdate \u003c date('1993-10-01') + interval '3' month", - "Table": "orders" - }, - { - "OperatorType": "Route", - "Variant": "SelectEqualUnique", - "Keyspace": { - "Name": "main", - "Sharded": true - }, - "FieldQuery": "select sum(l_extendedprice * (1 - l_discount)) as revenue from lineitem where 1 != 1", - "Query": "select sum(l_extendedprice * (1 - l_discount)) as revenue from lineitem where l_returnflag = 'R' and l_orderkey = :o_orderkey and :c_custkey = :o_custkey", - "Table": "lineitem", - "Values": [ - ":o_orderkey" - ], - "Vindex": "lineitem_map" - } - ] } ] } diff --git a/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt b/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt index 54cb40259bd..e623f73f77d 100644 --- a/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt +++ b/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt @@ -491,7 +491,7 @@ "Sharded": true }, "FieldQuery": "select u1.col, u1.id from `user` as u1 where 1 != 1", - "Query": "select u1.col, u1.id from `user` as u1", + "Query": "select u1.col, u1.id from `user` as u1 where u1.col = :u3_col", "Table": "`user`" }, { @@ -502,7 +502,7 @@ "Sharded": true }, "FieldQuery": "select 1 from `user` as u2 where 1 != 1", - "Query": "select 1 from `user` as u2 where u2.col = :u1_col and :u3_col = :u1_col", + "Query": "select 1 from `user` as u2 where u2.col = :u1_col", "Table": "`user`" } ] @@ -655,7 +655,7 @@ "Sharded": true }, "FieldQuery": "select u1.col, u1.id from `user` as u1 where 1 != 1", - "Query": "select u1.col, u1.id from `user` as u1", + "Query": "select u1.col, u1.id from `user` as u1 where u1.col = :u4_col", "Table": "`user`" }, { @@ -666,7 +666,7 @@ "Sharded": true }, "FieldQuery": "select 1 from `user` as u3 where 1 != 1", - "Query": "select 1 from `user` as u3 where u3.id = :u1_col and :u4_col = :u1_col", + "Query": "select 1 from `user` as u3 where u3.id = :u1_col", "Table": "`user`", "Values": [ ":u1_col" @@ -680,7 +680,6 @@ ] } } - # Test reuse of join var already being supplied to the right of a node. "select u1.id from user u1 join (user u2 join user u3) where u2.id = u1.col and u3.id = u1.col" { From 917c344491945b593ae3937856891ae8561917fb Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 16:02:02 +0200 Subject: [PATCH 06/10] Removed unrequired clone of joinTree's vars map Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/jointree.go | 15 +++++---------- 1 file changed, 5 insertions(+), 10 deletions(-) diff --git a/go/vt/vtgate/planbuilder/jointree.go b/go/vt/vtgate/planbuilder/jointree.go index c1753cc70e1..4f9c2175852 100644 --- a/go/vt/vtgate/planbuilder/jointree.go +++ b/go/vt/vtgate/planbuilder/jointree.go @@ -42,14 +42,10 @@ func (jp *joinTree) tableID() semantics.TableSet { func (jp *joinTree) clone() queryTree { result := &joinTree{ - lhs: jp.lhs.clone(), - rhs: jp.rhs.clone(), - outer: jp.outer, - columns: jp.columns, - vars: make(map[string]int, len(jp.vars)), - } - for key, val := range jp.vars { - result.vars[key] = val + lhs: jp.lhs.clone(), + rhs: jp.rhs.clone(), + outer: jp.outer, + vars: jp.vars, } return result } @@ -82,9 +78,8 @@ func (jp *joinTree) pushOutputColumns(columns []*sqlparser.ColName, semTable *se outputColumns := make([]int, len(toTheLeft)) var l, r int - originalColSize := len(jp.vars) for i, isLeft := range toTheLeft { - outputColumns[i] = i + originalColSize + outputColumns[i] = i if isLeft { jp.columns = append(jp.columns, -lhsOffset[l]-1) l++ From b89c726882b6d366942136bb3baf905f1a8d0625 Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Wed, 15 Sep 2021 16:32:09 +0200 Subject: [PATCH 07/10] Reverted unwanted change Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/testdata/wireup_cases.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt b/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt index e623f73f77d..487b1d97583 100644 --- a/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt +++ b/go/vt/vtgate/planbuilder/testdata/wireup_cases.txt @@ -680,6 +680,7 @@ ] } } + # Test reuse of join var already being supplied to the right of a node. "select u1.id from user u1 join (user u2 join user u3) where u2.id = u1.col and u3.id = u1.col" { From 3e31961e4008756c4ed9c208e441b5cb5e8e2b90 Mon Sep 17 00:00:00 2001 From: Manan Gupta Date: Thu, 16 Sep 2021 11:13:37 +0530 Subject: [PATCH 08/10] made join planning simpler Signed-off-by: Manan Gupta --- go/vt/vtgate/planbuilder/route_planning.go | 87 ++++++---------------- 1 file changed, 22 insertions(+), 65 deletions(-) diff --git a/go/vt/vtgate/planbuilder/route_planning.go b/go/vt/vtgate/planbuilder/route_planning.go index c60e756b9d9..cf56ac11929 100644 --- a/go/vt/vtgate/planbuilder/route_planning.go +++ b/go/vt/vtgate/planbuilder/route_planning.go @@ -461,25 +461,27 @@ func pushJoinPredicateOnJoin(ctx *planningContext, exprs []sqlparser.Expr, node node = node.clone().(*joinTree) var rhsPreds []sqlparser.Expr + var lhsPreds []sqlparser.Expr var lhsColumns []*sqlparser.ColName var lhsVarsName []string for _, expr := range exprs { - // we are pushing argument expression in a different way, if one side - // of the comparison is an argument (*sqlparser.Argument) coming from - // then we can push the expression to either left or right hand side - // (depending on who solves the expression). such expression do not - // need to be "outputed" and sent to the RHS of the join as we would - // usually do. - newNode, err := pushArgumentsOnJoin(ctx, expr, node) - if err != nil { - return nil, err - } - if newNode != nil { - // we are getting a new node from pushArgumentsOnJoin, meaning - // we do not need to break the predicate between LHS and RHS, thus we - // continue onto the following expression. - node = newNode + // We find the dependencies for the given expression and if they are solved entirely by one + // side of the join tree, then we push the predicate there and do not break it into parts. + // In case a predicate has no dependencies, then it is pushed to both sides so that we can filter + // rows as early as possible making join cheaper on the vtgate level. + depsForExpr := ctx.semTable.RecursiveDeps(expr) + singleSideDeps := false + if depsForExpr.IsSolvedBy(node.lhs.tableID()) { + lhsPreds = append(lhsPreds, expr) + singleSideDeps = true + } + if depsForExpr.IsSolvedBy(node.rhs.tableID()) { + rhsPreds = append(rhsPreds, expr) + singleSideDeps = true + } + + if singleSideDeps { continue } @@ -501,68 +503,23 @@ func pushJoinPredicateOnJoin(ctx *planningContext, exprs []sqlparser.Expr, node node.vars[lhsVarsName[i]] = idx } } + lhsPlan, err := pushJoinPredicate(ctx, lhsPreds, node.lhs) + if err != nil { + return nil, err + } rhsPlan, err := pushJoinPredicate(ctx, rhsPreds, node.rhs) if err != nil { return nil, err } return &joinTree{ - lhs: node.lhs, + lhs: lhsPlan, rhs: rhsPlan, outer: node.outer, vars: node.vars, }, nil } -func pushArgumentsOnJoin(ctx *planningContext, expr sqlparser.Expr, node *joinTree) (*joinTree, error) { - cmp, isCmp := expr.(*sqlparser.ComparisonExpr) - if !isCmp { - return nil, nil - } - - solvedByLeft, solvedByRight := isComparisonExprSolvedByJoinTree(ctx, cmp, node) - if !solvedByLeft && !solvedByRight { - return nil, nil - } - - var nodeToReplace queryTree - if solvedByLeft { - nodeToReplace = node.lhs - } else if solvedByRight { - nodeToReplace = node.rhs - } - - newNode, err := pushJoinPredicate(ctx, []sqlparser.Expr{expr}, nodeToReplace) - if err != nil { - return nil, err - } - - if solvedByLeft { - node.lhs = newNode - } else if solvedByRight { - node.rhs = newNode - } - return node, nil -} - -func isComparisonExprSolvedByJoinTree(ctx *planningContext, cmp *sqlparser.ComparisonExpr, node *joinTree) (bool, bool) { - var argExpr sqlparser.Expr - _, isLeftArg := cmp.Left.(sqlparser.Argument) - _, isRightArg := cmp.Right.(sqlparser.Argument) - if isLeftArg { - argExpr = cmp.Right - } else if isRightArg { - argExpr = cmp.Left - } else { - return false, false - } - - argDeps := ctx.semTable.RecursiveDeps(argExpr) - solvedByLeft := argDeps.IsSolvedBy(node.lhs.tableID()) - solvedByRight := argDeps.IsSolvedBy(node.rhs.tableID()) - return solvedByLeft, solvedByRight -} - func breakPredicateInLHSandRHS( expr sqlparser.Expr, semTable *semantics.SemTable, From 65860299dc4141c47cf84a1912afe81a7243caa7 Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Thu, 16 Sep 2021 08:42:03 +0200 Subject: [PATCH 09/10] Reverted cached_size import changes Signed-off-by: Florent Poinsard --- go/tools/sizegen/integration/cached_size.go | 1 - go/vt/vtgate/engine/cached_size.go | 1 - go/vt/vtgate/vindexes/cached_size.go | 1 - 3 files changed, 3 deletions(-) diff --git a/go/tools/sizegen/integration/cached_size.go b/go/tools/sizegen/integration/cached_size.go index 6023b29b7e4..a841d94f88b 100644 --- a/go/tools/sizegen/integration/cached_size.go +++ b/go/tools/sizegen/integration/cached_size.go @@ -21,7 +21,6 @@ import ( "math" "reflect" "unsafe" - hack "vitess.io/vitess/go/hack" ) diff --git a/go/vt/vtgate/engine/cached_size.go b/go/vt/vtgate/engine/cached_size.go index a1db2e3f185..380328449b5 100644 --- a/go/vt/vtgate/engine/cached_size.go +++ b/go/vt/vtgate/engine/cached_size.go @@ -21,7 +21,6 @@ import ( "math" "reflect" "unsafe" - hack "vitess.io/vitess/go/hack" ) diff --git a/go/vt/vtgate/vindexes/cached_size.go b/go/vt/vtgate/vindexes/cached_size.go index 10af44ae6b2..a22932e6155 100644 --- a/go/vt/vtgate/vindexes/cached_size.go +++ b/go/vt/vtgate/vindexes/cached_size.go @@ -21,7 +21,6 @@ import ( "math" "reflect" "unsafe" - hack "vitess.io/vitess/go/hack" ) From a837c83149d5f5542b1a6f8f1dd140420b578459 Mon Sep 17 00:00:00 2001 From: Florent Poinsard Date: Thu, 16 Sep 2021 09:18:05 +0200 Subject: [PATCH 10/10] Error instead of panic in pushJoinPredicate Signed-off-by: Florent Poinsard --- go/vt/vtgate/planbuilder/route_planning.go | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/go/vt/vtgate/planbuilder/route_planning.go b/go/vt/vtgate/planbuilder/route_planning.go index cf56ac11929..427fa64b958 100644 --- a/go/vt/vtgate/planbuilder/route_planning.go +++ b/go/vt/vtgate/planbuilder/route_planning.go @@ -17,7 +17,6 @@ limitations under the License. package planbuilder import ( - "fmt" "io" "sort" @@ -419,7 +418,7 @@ func pushJoinPredicate(ctx *planningContext, exprs []sqlparser.Expr, tree queryT // vindexFunc cannot accept predicates from the other side of a join return node, nil default: - panic(fmt.Sprintf("BUG: unknown type %T", node)) + return nil, vterrors.Errorf(vtrpcpb.Code_INTERNAL, "BUG: unknown type %T", node) } }