From add388758e57587624f3301b7be339777bdd28aa Mon Sep 17 00:00:00 2001 From: wangweicugw <38103831+wangweicugw@users.noreply.github.com> Date: Mon, 1 Apr 2024 21:44:55 +0800 Subject: [PATCH] Optimize with IN Clause for UPDATE/DELETE Statements on Vindexes (#15455) --- .../queries/benchmark/benchmark_test.go | 68 +++++++++++++++++++ .../endtoend/vtgate/queries/dml/dml_test.go | 51 +++++++++++++- go/vt/vtgate/autocommit_test.go | 9 ++- go/vt/vtgate/engine/delete.go | 4 +- go/vt/vtgate/engine/delete_test.go | 35 +++++++++- go/vt/vtgate/engine/dml.go | 5 +- go/vt/vtgate/engine/dml_with_input_test.go | 4 +- go/vt/vtgate/engine/update.go | 4 +- go/vt/vtgate/engine/update_test.go | 47 +++++++++++-- go/vt/vtgate/executor_dml_test.go | 14 ++-- .../planbuilder/operator_transformers.go | 14 ++-- .../planbuilder/testdata/dml_cases.json | 24 +++---- 12 files changed, 235 insertions(+), 44 deletions(-) diff --git a/go/test/endtoend/vtgate/queries/benchmark/benchmark_test.go b/go/test/endtoend/vtgate/queries/benchmark/benchmark_test.go index 5ebb8c5e422..9a064c1769a 100644 --- a/go/test/endtoend/vtgate/queries/benchmark/benchmark_test.go +++ b/go/test/endtoend/vtgate/queries/benchmark/benchmark_test.go @@ -48,6 +48,33 @@ func (tq *testQuery) getInsertQuery(rows int) string { return fmt.Sprintf("insert into %s(%s) values %s", tq.tableName, strings.Join(tq.cols, ","), strings.Join(allRows, ",")) } +func (tq *testQuery) getUpdateQuery(rows int) string { + var allRows []string + var row []string + for i, isInt := range tq.intTyp { + if isInt { + row = append(row, strconv.Itoa(i)) + continue + } + row = append(row, tq.cols[i]+" = '"+getRandomString(50)+"'") + } + allRows = append(allRows, strings.Join(row, ",")) + + var ids []string + for i := 0; i <= rows; i++ { + ids = append(ids, strconv.Itoa(i)) + } + return fmt.Sprintf("update %s set %s where id in (%s)", tq.tableName, strings.Join(allRows, ","), strings.Join(ids, ",")) +} + +func (tq *testQuery) getDeleteQuery(rows int) string { + var ids []string + for i := 0; i <= rows; i++ { + ids = append(ids, strconv.Itoa(i)) + } + return fmt.Sprintf("delete from %s where id in (%s)", tq.tableName, strings.Join(ids, ",")) +} + func getRandomString(size int) string { var str strings.Builder @@ -78,3 +105,44 @@ func BenchmarkShardedTblNoLookup(b *testing.B) { }) } } + +func BenchmarkShardedTblUpdateIn(b *testing.B) { + conn, closer := start(b) + defer closer() + + cols := []string{"c1", "c2", "c3", "c4", "c5", "c6", "c7", "c8", "c9", "c10", "c11", "c12"} + intType := make([]bool, len(cols)) + tq := &testQuery{ + tableName: "tbl_no_lkp_vdx", + cols: cols, + intTyp: intType, + } + insStmt := tq.getInsertQuery(10000) + _ = utils.Exec(b, conn, insStmt) + for _, rows := range []int{1, 10, 100, 500, 1000, 5000, 10000} { + updStmt := tq.getUpdateQuery(rows) + b.Run(fmt.Sprintf("16-shards-%d-rows", rows), func(b *testing.B) { + for i := 0; i < b.N; i++ { + _ = utils.Exec(b, conn, updStmt) + } + }) + } +} + +func BenchmarkShardedTblDeleteIn(b *testing.B) { + conn, closer := start(b) + defer closer() + tq := &testQuery{ + tableName: "tbl_no_lkp_vdx", + } + for _, rows := range []int{1, 10, 100, 500, 1000, 5000, 10000} { + insStmt := tq.getInsertQuery(rows) + _ = utils.Exec(b, conn, insStmt) + delStmt := tq.getDeleteQuery(rows) + b.Run(fmt.Sprintf("16-shards-%d-rows", rows), func(b *testing.B) { + for i := 0; i < b.N; i++ { + _ = utils.Exec(b, conn, delStmt) + } + }) + } +} diff --git a/go/test/endtoend/vtgate/queries/dml/dml_test.go b/go/test/endtoend/vtgate/queries/dml/dml_test.go index 98db03bee0c..3841a05fcdb 100644 --- a/go/test/endtoend/vtgate/queries/dml/dml_test.go +++ b/go/test/endtoend/vtgate/queries/dml/dml_test.go @@ -19,10 +19,12 @@ package dml import ( "testing" + "vitess.io/vitess/go/mysql" + "vitess.io/vitess/go/sqltypes" + "vitess.io/vitess/go/test/endtoend/utils" + "github.com/stretchr/testify/assert" "github.com/stretchr/testify/require" - - "vitess.io/vitess/go/test/endtoend/utils" ) func TestMultiEqual(t *testing.T) { @@ -363,3 +365,48 @@ func TestMultiTargetUpdate(t *testing.T) { mcmp.AssertMatches(`select oid, ename from oevent_tbl order by oid`, `[[INT64(1) VARCHAR("a")] [INT64(2) VARCHAR("xyz")] [INT64(3) VARCHAR("a")] [INT64(4) VARCHAR("a")]]`) } + +// TestDMLInUnique for update/delete statement using an IN clause with the Vindexes, +// the query is correctly split according to the corresponding values in the IN list. +func TestDMLInUnique(t *testing.T) { + utils.SkipIfBinaryIsBelowVersion(t, 20, "vtgate") + + mcmp, closer := start(t) + defer closer() + + // initial rows + mcmp.Exec("insert into user_tbl(id, region_id, `name`) values (1,1,'a'),(2,2,'a'),(3,3,'a'),(4,4,'a'),(5,5,'a'),(6,6,'a')") + + qr := mcmp.Exec("update user_tbl set `name` = 'b' where region_id in (1,2,3,4,5,6)") + assert.EqualValues(t, 6, qr.RowsAffected) + qr = mcmp.Exec("delete from user_tbl where region_id in (1,2,3,4,5,6)") + assert.EqualValues(t, 6, qr.RowsAffected) + mcmp.Exec("insert into user_tbl(id, region_id, `name`) values (1,1,'a'),(2,2,'a'),(3,3,'a'),(4,4,'a'),(5,5,'a'),(6,6,'a')") + + assertVExplainEquals := func(t *testing.T, conn *mysql.Conn, query, expected string) { + t.Helper() + qr := utils.Exec(t, conn, query) + // strip the first column from each row as it is not deterministic in a VExplain query + for i := range qr.Rows { + qr.Rows[i] = qr.Rows[i][1:] + } + if err := sqltypes.RowsEqualsStr(expected, qr.Rows); err != nil { + t.Error(err) + } + } + expected := `[ + [VARCHAR("sks") VARCHAR("-80") VARCHAR("begin")] + [VARCHAR("sks") VARCHAR("-80") VARCHAR("update user_tbl set ` + "`name`" + ` = 'b' where region_id in (1, 2, 3, 5)")] + [VARCHAR("sks") VARCHAR("80-") VARCHAR("begin")] + [VARCHAR("sks") VARCHAR("80-") VARCHAR("update user_tbl set ` + "`name`" + ` = 'b' where region_id in (4, 6)")] + ]` + assertVExplainEquals(t, mcmp.VtConn, "vexplain /*vt+ EXECUTE_DML_QUERIES */ queries update user_tbl set `name` = 'b' where region_id in (1,2,3,4,5,6)", expected) + + expected = `[ + [VARCHAR("sks") VARCHAR("-80") VARCHAR("begin")] + [VARCHAR("sks") VARCHAR("-80") VARCHAR("delete from user_tbl where region_id in (1, 2, 3, 5)")] + [VARCHAR("sks") VARCHAR("80-") VARCHAR("begin")] + [VARCHAR("sks") VARCHAR("80-") VARCHAR("delete from user_tbl where region_id in (4, 6)")] + ]` + assertVExplainEquals(t, mcmp.VtConn, "vexplain /*vt+ EXECUTE_DML_QUERIES */ queries delete from user_tbl where region_id in (1,2,3,4,5,6)", expected) +} diff --git a/go/vt/vtgate/autocommit_test.go b/go/vt/vtgate/autocommit_test.go index fa63695bfbd..1ba99c01ef2 100644 --- a/go/vt/vtgate/autocommit_test.go +++ b/go/vt/vtgate/autocommit_test.go @@ -185,8 +185,10 @@ func TestAutocommitDeleteIn(t *testing.T) { require.NoError(t, err) assertQueries(t, sbc1, []*querypb.BoundQuery{{ - Sql: "delete from user_extra where user_id in (1, 2)", - BindVariables: map[string]*querypb.BindVariable{}, + Sql: "delete from user_extra where user_id in ::__vals", + BindVariables: map[string]*querypb.BindVariable{ + "__vals": sqltypes.TestBindVariable([]any{int64(1), int64(2)}), + }, }}) testCommitCount(t, "sbc1", sbc1, 0) @@ -391,11 +393,12 @@ func TestAutocommitTransactionStarted(t *testing.T) { // multi shard query - savepoint needed sql = "update `user` set a = 2 where id in (1, 4)" + expectedSql := "update `user` set a = 2 where id in ::__vals" _, err = executor.Execute(context.Background(), nil, "TestExecute", NewSafeSession(session), sql, map[string]*querypb.BindVariable{}) require.NoError(t, err) require.Len(t, sbc1.Queries, 2) require.Contains(t, sbc1.Queries[0].Sql, "savepoint") - require.Equal(t, sql, sbc1.Queries[1].Sql) + require.Equal(t, expectedSql, sbc1.Queries[1].Sql) testCommitCount(t, "sbc1", sbc1, 0) } diff --git a/go/vt/vtgate/engine/delete.go b/go/vt/vtgate/engine/delete.go index adcc11174fd..6e354aae5f5 100644 --- a/go/vt/vtgate/engine/delete.go +++ b/go/vt/vtgate/engine/delete.go @@ -45,7 +45,7 @@ func (del *Delete) TryExecute(ctx context.Context, vcursor VCursor, bindVars map ctx, cancelFunc := addQueryTimeout(ctx, vcursor, del.QueryTimeout) defer cancelFunc() - rss, _, err := del.findRoute(ctx, vcursor, bindVars) + rss, bvs, err := del.findRoute(ctx, vcursor, bindVars) if err != nil { return nil, err } @@ -58,7 +58,7 @@ func (del *Delete) TryExecute(ctx context.Context, vcursor VCursor, bindVars map case Unsharded: return del.execUnsharded(ctx, del, vcursor, bindVars, rss) case Equal, IN, Scatter, ByDestination, SubShard, EqualUnique, MultiEqual: - return del.execMultiDestination(ctx, del, vcursor, bindVars, rss, del.deleteVindexEntries) + return del.execMultiDestination(ctx, del, vcursor, bindVars, rss, del.deleteVindexEntries, bvs) default: // Unreachable. return nil, fmt.Errorf("unsupported opcode: %v", del.Opcode) diff --git a/go/vt/vtgate/engine/delete_test.go b/go/vt/vtgate/engine/delete_test.go index d8485765ca9..18dcef5cbe4 100644 --- a/go/vt/vtgate/engine/delete_test.go +++ b/go/vt/vtgate/engine/delete_test.go @@ -544,7 +544,7 @@ func TestDeleteInChangedVindexMultiCol(t *testing.T) { `Execute delete from lkp_rg_tbl where from = :from and toc = :toc from: type:INT64 value:"6" toc: type:VARBINARY value:"\x01N\xb1\x90ɢ\xfa\x16\x9c" true`, `Execute delete from lkp_rg_tbl where from = :from and toc = :toc from: type:INT64 value:"7" toc: type:VARBINARY value:"\x02N\xb1\x90ɢ\xfa\x16\x9c" true`, // Finally, the actual delete, which is also sent to -20, same route as the subquery. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals0: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) } @@ -611,3 +611,36 @@ func TestDeleteMultiEqual(t *testing.T) { `ExecuteMultiShard sharded.-20: dummy_delete {} sharded.20-: dummy_delete {} true false`, }) } + +// TestDeleteInUnique is a test function for delete statement using an IN clause with the Vindexes, +// the query is correctly split according to the corresponding values in the IN list. +func TestDeleteInUnique(t *testing.T) { + ks := buildTestVSchema().Keyspaces["sharded"] + upd := &Delete{ + DML: &DML{ + RoutingParameters: &RoutingParameters{ + Opcode: IN, + Keyspace: ks.Keyspace, + Vindex: ks.Vindexes["hash"], + Values: []evalengine.Expr{evalengine.TupleExpr{ + evalengine.NewLiteralInt(1), + evalengine.NewLiteralInt(2), + evalengine.NewLiteralInt(4), + }}}, + Query: "delete t where id in ::__vals", + }, + } + + tupleBV := &querypb.BindVariable{ + Type: querypb.Type_TUPLE, + Values: append([]*querypb.Value{sqltypes.ValueToProto(sqltypes.NewInt64(1))}, sqltypes.ValueToProto(sqltypes.NewInt64(2)), sqltypes.ValueToProto(sqltypes.NewInt64(4))), + } + vc := newDMLTestVCursor("-20", "20-") + vc.shardForKsid = []string{"-20", "20-"} + _, err := upd.TryExecute(context.Background(), vc, map[string]*querypb.BindVariable{"__vals": tupleBV}, false) + require.NoError(t, err) + vc.ExpectLog(t, []string{ + `ResolveDestinations sharded [type:INT64 value:"1" type:INT64 value:"2" type:INT64 value:"4"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f),DestinationKeyspaceID(d2fd8867d50d2dfe)`, + `ExecuteMultiShard sharded.-20: delete t where id in ::__vals {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"4"}} sharded.20-: delete t where id in ::__vals {__vals: type:TUPLE values:{type:INT64 value:"2"}} true false`, + }) +} diff --git a/go/vt/vtgate/engine/dml.go b/go/vt/vtgate/engine/dml.go index 463008a4433..db777c36698 100644 --- a/go/vt/vtgate/engine/dml.go +++ b/go/vt/vtgate/engine/dml.go @@ -78,7 +78,8 @@ func (dml *DML) execUnsharded(ctx context.Context, primitive Primitive, vcursor return execShard(ctx, primitive, vcursor, dml.Query, bindVars, rss[0], true /* rollbackOnError */, !dml.PreventAutoCommit /* canAutocommit */) } -func (dml *DML) execMultiDestination(ctx context.Context, primitive Primitive, vcursor VCursor, bindVars map[string]*querypb.BindVariable, rss []*srvtopo.ResolvedShard, dmlSpecialFunc func(context.Context, VCursor, map[string]*querypb.BindVariable, []*srvtopo.ResolvedShard) error) (*sqltypes.Result, error) { +func (dml *DML) execMultiDestination(ctx context.Context, primitive Primitive, vcursor VCursor, bindVars map[string]*querypb.BindVariable, rss []*srvtopo.ResolvedShard, dmlSpecialFunc func(context.Context, VCursor, + map[string]*querypb.BindVariable, []*srvtopo.ResolvedShard) error, bvs []map[string]*querypb.BindVariable) (*sqltypes.Result, error) { if len(rss) == 0 { return &sqltypes.Result{}, nil } @@ -90,7 +91,7 @@ func (dml *DML) execMultiDestination(ctx context.Context, primitive Primitive, v for i := range rss { queries[i] = &querypb.BoundQuery{ Sql: dml.Query, - BindVariables: bindVars, + BindVariables: bvs[i], } } return execMultiShard(ctx, primitive, vcursor, rss, queries, dml.MultiShardAutocommit) diff --git a/go/vt/vtgate/engine/dml_with_input_test.go b/go/vt/vtgate/engine/dml_with_input_test.go index e43bc2b151f..b41dc9e148c 100644 --- a/go/vt/vtgate/engine/dml_with_input_test.go +++ b/go/vt/vtgate/engine/dml_with_input_test.go @@ -164,7 +164,7 @@ func TestDeleteWithMultiTarget(t *testing.T) { require.NoError(t, err) vc.ExpectLog(t, []string{ `ResolveDestinations ks [type:INT64 value:"1" type:INT64 value:"2" type:INT64 value:"3"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f),DestinationKeyspaceID(4eb190c9a2fa169c)`, - `ExecuteMultiShard ks.-20: dummy_delete_1 {dml_vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} values:{type:INT64 value:"3"}} true true`, + `ExecuteMultiShard ks.-20: dummy_delete_1 {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} values:{type:INT64 value:"3"} dml_vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} values:{type:INT64 value:"3"}} true true`, `ResolveDestinations ks [type:INT64 value:"1" type:INT64 value:"2" type:INT64 value:"3"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f),DestinationKeyspaceID(4eb190c9a2fa169c)`, `ExecuteMultiShard ks.-20: dummy_delete_2 {dml_vals: type:TUPLE values:{type:TUPLE value:"\x89\x02\x03100\x89\x02\x011"} values:{type:TUPLE value:"\x89\x02\x03100\x89\x02\x012"} values:{type:TUPLE value:"\x89\x02\x03200\x89\x02\x013"}} true true`, }) @@ -175,7 +175,7 @@ func TestDeleteWithMultiTarget(t *testing.T) { require.NoError(t, err) vc.ExpectLog(t, []string{ `ResolveDestinations ks [type:INT64 value:"1" type:INT64 value:"2" type:INT64 value:"3"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f),DestinationKeyspaceID(4eb190c9a2fa169c)`, - `ExecuteMultiShard ks.-20: dummy_delete_1 {dml_vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} values:{type:INT64 value:"3"}} true true`, + `ExecuteMultiShard ks.-20: dummy_delete_1 {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} values:{type:INT64 value:"3"} dml_vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} values:{type:INT64 value:"3"}} true true`, `ResolveDestinations ks [type:INT64 value:"1" type:INT64 value:"2" type:INT64 value:"3"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f),DestinationKeyspaceID(4eb190c9a2fa169c)`, `ExecuteMultiShard ks.-20: dummy_delete_2 {dml_vals: type:TUPLE values:{type:TUPLE value:"\x89\x02\x03100\x89\x02\x011"} values:{type:TUPLE value:"\x89\x02\x03100\x89\x02\x012"} values:{type:TUPLE value:"\x89\x02\x03200\x89\x02\x013"}} true true`, }) diff --git a/go/vt/vtgate/engine/update.go b/go/vt/vtgate/engine/update.go index 323b7ab40ac..13c590bbb63 100644 --- a/go/vt/vtgate/engine/update.go +++ b/go/vt/vtgate/engine/update.go @@ -56,7 +56,7 @@ func (upd *Update) TryExecute(ctx context.Context, vcursor VCursor, bindVars map ctx, cancelFunc := addQueryTimeout(ctx, vcursor, upd.QueryTimeout) defer cancelFunc() - rss, _, err := upd.findRoute(ctx, vcursor, bindVars) + rss, bvs, err := upd.findRoute(ctx, vcursor, bindVars) if err != nil { return nil, err } @@ -69,7 +69,7 @@ func (upd *Update) TryExecute(ctx context.Context, vcursor VCursor, bindVars map case Unsharded: return upd.execUnsharded(ctx, upd, vcursor, bindVars, rss) case Equal, EqualUnique, IN, Scatter, ByDestination, SubShard, MultiEqual: - return upd.execMultiDestination(ctx, upd, vcursor, bindVars, rss, upd.updateVindexEntries) + return upd.execMultiDestination(ctx, upd, vcursor, bindVars, rss, upd.updateVindexEntries, bvs) default: // Unreachable. return nil, fmt.Errorf("unsupported opcode: %v", upd.Opcode) diff --git a/go/vt/vtgate/engine/update_test.go b/go/vt/vtgate/engine/update_test.go index 9d583cdcfcf..eab2742fc15 100644 --- a/go/vt/vtgate/engine/update_test.go +++ b/go/vt/vtgate/engine/update_test.go @@ -638,7 +638,7 @@ func TestUpdateIn(t *testing.T) { vc.ExpectLog(t, []string{ `ResolveDestinations sharded [type:INT64 value:"1" type:INT64 value:"2"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f)`, // ResolveDestinations is hard-coded to return -20. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) } @@ -664,7 +664,7 @@ func TestUpdateInStreamExecute(t *testing.T) { vc.ExpectLog(t, []string{ `ResolveDestinations sharded [type:INT64 value:"1" type:INT64 value:"2"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f)`, // ResolveDestinations is hard-coded to return -20. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) } @@ -689,7 +689,7 @@ func TestUpdateInMultiCol(t *testing.T) { vc.ExpectLog(t, []string{ `ResolveDestinationsMultiCol sharded [[INT64(1) INT64(3)] [INT64(1) INT64(4)] [INT64(2) INT64(3)] [INT64(2) INT64(4)]] Destinations:DestinationKeyspaceID(014eb190c9a2fa169c),DestinationKeyspaceID(01d2fd8867d50d2dfe),DestinationKeyspaceID(024eb190c9a2fa169c),DestinationKeyspaceID(02d2fd8867d50d2dfe)`, // ResolveDestinations is hard-coded to return -20. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals0: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"} __vals1: type:TUPLE values:{type:INT64 value:"3"} values:{type:INT64 value:"4"}} true true`, }) } @@ -762,7 +762,7 @@ func TestUpdateInChangedVindex(t *testing.T) { `Execute delete from lkp1 where from = :from and toc = :toc from: type:INT64 value:"23" toc: type:VARBINARY value:"\x06\xe7\xea\"Βp\x8f" true`, `Execute insert into lkp1(from, toc) values(:from_0, :toc_0) from_0: type:INT64 value:"3" toc_0: type:VARBINARY value:"\x06\xe7\xea\"Βp\x8f" true`, // Finally, the actual update, which is also sent to -20, same route as the subquery. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) // No rows changing @@ -776,7 +776,7 @@ func TestUpdateInChangedVindex(t *testing.T) { // It gets used to perform the subquery to fetch the changing column values. `ExecuteMultiShard sharded.-20: dummy_subquery {} false false`, // Subquery returns no rows. So, no vindexes are updated. We still pass-through the original update. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) // multiple rows changing. @@ -819,7 +819,7 @@ func TestUpdateInChangedVindex(t *testing.T) { `Execute delete from lkp1 where from = :from and toc = :toc from: type:INT64 value:"23" toc: type:VARBINARY value:"\x06\xe7\xea\"Βp\x8f" true`, `Execute insert into lkp1(from, toc) values(:from_0, :toc_0) from_0: type:INT64 value:"3" toc_0: type:VARBINARY value:"\x06\xe7\xea\"Βp\x8f" true`, // Finally, the actual update, which is also sent to -20, same route as the subquery. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) } @@ -881,7 +881,7 @@ func TestUpdateInChangedVindexMultiCol(t *testing.T) { `Execute delete from lkp_rg_tbl where from = :from and toc = :toc from: type:INT64 value:"7" toc: type:VARBINARY value:"\x02N\xb1\x90ɢ\xfa\x16\x9c" true`, `Execute insert into lkp_rg_tbl(from, toc) values(:from_0, :toc_0) from_0: type:INT64 value:"5" toc_0: type:VARBINARY value:"\x02N\xb1\x90ɢ\xfa\x16\x9c" true`, // Finally, the actual update, which is also sent to -20, same route as the subquery. - `ExecuteMultiShard sharded.-20: dummy_update {} true true`, + `ExecuteMultiShard sharded.-20: dummy_update {__vals0: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"2"}} true true`, }) } @@ -949,6 +949,39 @@ func TestUpdateMultiEqual(t *testing.T) { }) } +// TestUpdateInUnique is a test function for update statement using an IN clause with the Vindexes, +// the query is correctly split according to the corresponding values in the IN list. +func TestUpdateInUnique(t *testing.T) { + ks := buildTestVSchema().Keyspaces["sharded"] + upd := &Update{ + DML: &DML{ + RoutingParameters: &RoutingParameters{ + Opcode: IN, + Keyspace: ks.Keyspace, + Vindex: ks.Vindexes["hash"], + Values: []evalengine.Expr{evalengine.TupleExpr{ + evalengine.NewLiteralInt(1), + evalengine.NewLiteralInt(2), + evalengine.NewLiteralInt(4), + }}}, + Query: "update t set n = 'b' where id in ::__vals", + }, + } + + tupleBV := &querypb.BindVariable{ + Type: querypb.Type_TUPLE, + Values: append([]*querypb.Value{sqltypes.ValueToProto(sqltypes.NewInt64(1))}, sqltypes.ValueToProto(sqltypes.NewInt64(2)), sqltypes.ValueToProto(sqltypes.NewInt64(4))), + } + vc := newDMLTestVCursor("-20", "20-") + vc.shardForKsid = []string{"-20", "20-"} + _, err := upd.TryExecute(context.Background(), vc, map[string]*querypb.BindVariable{"__vals": tupleBV}, false) + require.NoError(t, err) + vc.ExpectLog(t, []string{ + `ResolveDestinations sharded [type:INT64 value:"1" type:INT64 value:"2" type:INT64 value:"4"] Destinations:DestinationKeyspaceID(166b40b44aba4bd6),DestinationKeyspaceID(06e7ea22ce92708f),DestinationKeyspaceID(d2fd8867d50d2dfe)`, + `ExecuteMultiShard sharded.-20: update t set n = 'b' where id in ::__vals {__vals: type:TUPLE values:{type:INT64 value:"1"} values:{type:INT64 value:"4"}} sharded.20-: update t set n = 'b' where id in ::__vals {__vals: type:TUPLE values:{type:INT64 value:"2"}} true false`, + }) +} + func buildTestVSchema() *vindexes.VSchema { invschema := &vschemapb.SrvVSchema{ Keyspaces: map[string]*vschemapb.Keyspace{ diff --git a/go/vt/vtgate/executor_dml_test.go b/go/vt/vtgate/executor_dml_test.go index b1d62966a43..3dce4e212ef 100644 --- a/go/vt/vtgate/executor_dml_test.go +++ b/go/vt/vtgate/executor_dml_test.go @@ -876,8 +876,10 @@ func TestUpdateUseHigherCostVindexIfBackfilling(t *testing.T) { Sql: "select id, wo_lu_col, erl_lu_col, srl_lu_col, nrl_lu_col, nv_lu_col, lu_col, lu_col = 5 from t2_lookup where wo_lu_col = 2 and lu_col in (1, 2) for update", BindVariables: map[string]*querypb.BindVariable{}, }, { - Sql: "update t2_lookup set lu_col = 5 where wo_lu_col = 2 and lu_col in (1, 2)", - BindVariables: map[string]*querypb.BindVariable{}, + Sql: "update t2_lookup set lu_col = 5 where wo_lu_col = 2 and lu_col in ::__vals", + BindVariables: map[string]*querypb.BindVariable{ + "__vals": sqltypes.TestBindVariable([]any{int64(1), int64(2)}), + }, }} vars, _ := sqltypes.BuildBindVariable([]any{ @@ -1109,8 +1111,10 @@ func TestDeleteUseHigherCostVindexIfBackfilling(t *testing.T) { Sql: "select id, wo_lu_col, erl_lu_col, srl_lu_col, nrl_lu_col, nv_lu_col, lu_col from t2_lookup where wo_lu_col = 1 and lu_col in (1, 2) for update", BindVariables: map[string]*querypb.BindVariable{}, }, { - Sql: "delete from t2_lookup where wo_lu_col = 1 and lu_col in (1, 2)", - BindVariables: map[string]*querypb.BindVariable{}, + Sql: "delete from t2_lookup where wo_lu_col = 1 and lu_col in ::__vals", + BindVariables: map[string]*querypb.BindVariable{ + "__vals": sqltypes.TestBindVariable([]any{int64(1), int64(2)}), + }, }} vars, _ := sqltypes.BuildBindVariable([]any{ @@ -3107,7 +3111,7 @@ func TestDeleteMultiTable(t *testing.T) { {Sql: "select `user`.id, `user`.col from `user`", BindVariables: map[string]*querypb.BindVariable{}}, bq, bq, bq, bq, bq, bq, bq, bq, {Sql: "select `user`.Id, `user`.`name` from `user` where `user`.id in ::dml_vals for update", BindVariables: map[string]*querypb.BindVariable{"dml_vals": {Type: querypb.Type_TUPLE, Values: dmlVals}}}, - {Sql: "delete from `user` where `user`.id in ::dml_vals", BindVariables: map[string]*querypb.BindVariable{"dml_vals": {Type: querypb.Type_TUPLE, Values: dmlVals}}}} + {Sql: "delete from `user` where `user`.id in ::dml_vals", BindVariables: map[string]*querypb.BindVariable{"__vals": sqltypes.TestBindVariable([]any{int64(1), int64(1), int64(1), int64(1), int64(1), int64(1), int64(1), int64(1)}), "dml_vals": {Type: querypb.Type_TUPLE, Values: dmlVals}}}} assertQueries(t, sbc1, wantQueries) wantQueries = []*querypb.BoundQuery{ diff --git a/go/vt/vtgate/planbuilder/operator_transformers.go b/go/vt/vtgate/planbuilder/operator_transformers.go index f0783a5ecfb..572afa42f72 100644 --- a/go/vt/vtgate/planbuilder/operator_transformers.go +++ b/go/vt/vtgate/planbuilder/operator_transformers.go @@ -562,7 +562,7 @@ func transformRoutePlan(ctx *plancontext.PlanningContext, op *operators.Route) ( } func buildRouteLogicalPlan(ctx *plancontext.PlanningContext, op *operators.Route, stmt sqlparser.SelectStatement, hints *queryHints) (logicalPlan, error) { - _ = updateSelectedVindexPredicate(op) + _ = updateSelectedVindexPredicate(op.Routing) eroute, err := routeToEngineRoute(ctx, op, hints) for _, order := range op.Ordering { @@ -705,7 +705,7 @@ func buildUpdateLogicalPlan( if upd.VerifyAll { stmt.SetComments(stmt.GetParsedComments().SetMySQLSetVarValue(sysvars.ForeignKeyChecks, "OFF")) } - + _ = updateSelectedVindexPredicate(rb.Routing) edml := createDMLPrimitive(ctx, rb, hints, upd.Target.VTable, generateQuery(stmt), vindexes, vQuery) return &primitiveWrapper{prim: &engine.Update{ @@ -725,7 +725,7 @@ func buildDeleteLogicalPlan(ctx *plancontext.PlanningContext, rb *operators.Rout vQuery = sqlparser.String(del.OwnedVindexQuery) vindexes = del.Target.VTable.Owned } - + _ = updateSelectedVindexPredicate(rb.Routing) edml := createDMLPrimitive(ctx, rb, hints, del.Target.VTable, generateQuery(stmt), vindexes, vQuery) return &primitiveWrapper{prim: &engine.Delete{DML: edml}}, nil @@ -755,8 +755,8 @@ func createDMLPrimitive(ctx *plancontext.PlanningContext, rb *operators.Route, h return edml } -func updateSelectedVindexPredicate(op *operators.Route) sqlparser.Expr { - tr, ok := op.Routing.(*operators.ShardedRouting) +func updateSelectedVindexPredicate(routing operators.Routing) sqlparser.Expr { + tr, ok := routing.(*operators.ShardedRouting) if !ok || tr.Selected == nil { return nil } @@ -771,7 +771,9 @@ func updateSelectedVindexPredicate(op *operators.Route) sqlparser.Expr { if !ok { continue } - + if sqlparser.Equals.Expr(cmp.Right, sqlparser.ListArg(engine.DmlVals)) { + continue + } var argName string if isMultiColumn { argName = engine.ListVarName + strconv.Itoa(idx) diff --git a/go/vt/vtgate/planbuilder/testdata/dml_cases.json b/go/vt/vtgate/planbuilder/testdata/dml_cases.json index 0b77104ee4c..224c41d43eb 100644 --- a/go/vt/vtgate/planbuilder/testdata/dml_cases.json +++ b/go/vt/vtgate/planbuilder/testdata/dml_cases.json @@ -2157,7 +2157,7 @@ "Sharded": true }, "TargetTabletType": "PRIMARY", - "Query": "update user_extra set val = 1 where user_id in (1, 2)", + "Query": "update user_extra set val = 1 where user_id in ::__vals", "Table": "user_extra", "Values": [ "(1, 2)" @@ -2383,7 +2383,7 @@ "Sharded": true }, "TargetTabletType": "PRIMARY", - "Query": "delete from user_extra where user_id in (1, 2)", + "Query": "delete from user_extra where user_id in ::__vals", "Table": "user_extra", "Values": [ "(1, 2)" @@ -2516,7 +2516,7 @@ "KsidLength": 1, "KsidVindex": "user_index", "OwnedVindexQuery": "select Id, `Name`, Costly, `name` = null from `user` where id in (1, 2, 3) for update", - "Query": "update `user` set `name` = null where id in (1, 2, 3)", + "Query": "update `user` set `name` = null where id in ::__vals", "Table": "user", "Values": [ "(1, 2, 3)" @@ -2601,7 +2601,7 @@ "KsidLength": 1, "KsidVindex": "user_index", "OwnedVindexQuery": "select Id, `Name`, Costly from `user` where id in (1, 2, 3) for update", - "Query": "delete from `user` where id in (1, 2, 3)", + "Query": "delete from `user` where id in ::__vals", "Table": "user", "Values": [ "(1, 2, 3)" @@ -3101,7 +3101,7 @@ "KsidLength": 1, "KsidVindex": "xxhash", "OwnedVindexQuery": "select c1, c2, c3 from t1 where c2 = 10 and c3 in (20, 21) for update", - "Query": "delete from t1 where c2 = 10 and c3 in (20, 21)", + "Query": "delete from t1 where c2 = 10 and c3 in ::__vals", "Table": "t1", "Values": [ "(20, 21)" @@ -3133,7 +3133,7 @@ "KsidLength": 1, "KsidVindex": "xxhash", "OwnedVindexQuery": "select c1, c2, c3, c2 = 1 from t1 where c2 = 10 and c3 in (20, 21) for update", - "Query": "update t1 set c2 = 1 where c2 = 10 and c3 in (20, 21)", + "Query": "update t1 set c2 = 1 where c2 = 10 and c3 in ::__vals", "Table": "t1", "Values": [ "(20, 21)" @@ -3266,7 +3266,7 @@ "Sharded": true }, "TargetTabletType": "PRIMARY", - "Query": "update multicol_tbl set x = 1 where colb in (1, 2) and cola = 1", + "Query": "update multicol_tbl set x = 1 where colb in ::__vals1 and cola = 1", "Table": "multicol_tbl", "Values": [ "1", @@ -3293,7 +3293,7 @@ "Sharded": true }, "TargetTabletType": "PRIMARY", - "Query": "update multicol_tbl set x = 1 where colb in (1, 2) and cola in (3, 4)", + "Query": "update multicol_tbl set x = 1 where colb in ::__vals1 and cola in ::__vals0", "Table": "multicol_tbl", "Values": [ "(3, 4)", @@ -3383,7 +3383,7 @@ "KsidLength": 2, "KsidVindex": "multicolIdx", "OwnedVindexQuery": "select cola, colb, colc, `name` from multicol_tbl where colb in (1, 2) and cola = 1 for update", - "Query": "delete from multicol_tbl where colb in (1, 2) and cola = 1", + "Query": "delete from multicol_tbl where colb in ::__vals1 and cola = 1", "Table": "multicol_tbl", "Values": [ "1", @@ -3413,7 +3413,7 @@ "KsidLength": 2, "KsidVindex": "multicolIdx", "OwnedVindexQuery": "select cola, colb, colc, `name` from multicol_tbl where colb in (1, 2) and cola in (3, 4) for update", - "Query": "delete from multicol_tbl where colb in (1, 2) and cola in (3, 4)", + "Query": "delete from multicol_tbl where colb in ::__vals1 and cola in ::__vals0", "Table": "multicol_tbl", "Values": [ "(3, 4)", @@ -3563,7 +3563,7 @@ "KsidLength": 2, "KsidVindex": "multicolIdx", "OwnedVindexQuery": "select cola, colb, colc, `name`, `name` = 'bar' from multicol_tbl where cola in (1, 2) for update", - "Query": "update multicol_tbl set `name` = 'bar' where cola in (1, 2)", + "Query": "update multicol_tbl set `name` = 'bar' where cola in ::__vals0", "Table": "multicol_tbl", "Values": [ "(1, 2)" @@ -3676,7 +3676,7 @@ "KsidLength": 2, "KsidVindex": "multicolIdx", "OwnedVindexQuery": "select cola, colb, colc, `name` from multicol_tbl where cola in (1, 2) for update", - "Query": "delete from multicol_tbl where cola in (1, 2)", + "Query": "delete from multicol_tbl where cola in ::__vals0", "Table": "multicol_tbl", "Values": [ "(1, 2)"