From 96fb6af521c990d0808b556a5f94c431980b6b26 Mon Sep 17 00:00:00 2001 From: Harshit Gangal Date: Mon, 10 May 2021 17:09:51 +0530 Subject: [PATCH] Queryservice fix Backport of #8089 This is a combination of 3 commits. * remove precheck of tablet serving and target * remove the additional logic and return error if queryservice not found to serve query * fix test as per new change Signed-off-by: Harshit Gangal Signed-off-by: Andres Taylor --- go/vt/discovery/fake_healthcheck.go | 7 ------- go/vt/discovery/healthcheck.go | 8 -------- go/vt/vtgate/legacy_scatter_conn_test.go | 25 ++++++++++++----------- go/vt/vtgate/scatter_conn.go | 18 +--------------- go/vt/vtgate/scatter_conn_test.go | 16 +++++++++++---- go/vt/vttablet/sandboxconn/sandboxconn.go | 17 +++++++++++---- 6 files changed, 39 insertions(+), 52 deletions(-) diff --git a/go/vt/discovery/fake_healthcheck.go b/go/vt/discovery/fake_healthcheck.go index bbb1ec98baa..4407ae50ebc 100644 --- a/go/vt/discovery/fake_healthcheck.go +++ b/go/vt/discovery/fake_healthcheck.go @@ -150,13 +150,6 @@ func (fhc *FakeHealthCheck) TabletConnection(alias *topodatapb.TabletAlias, targ defer fhc.mu.RUnlock() for _, item := range fhc.items { if proto.Equal(alias, item.ts.Tablet.Alias) { - if !item.ts.Serving { - return nil, vterrors.Errorf(vtrpcpb.Code_FAILED_PRECONDITION, vterrors.NotServing) - } - if target != nil && !proto.Equal(item.ts.Target, target) { - return nil, vterrors.Errorf(vtrpcpb.Code_FAILED_PRECONDITION, "%s: target mismatch %v vs %v", vterrors.WrongTablet, item.ts.Target, target) - } - return item.ts.Conn, nil } } diff --git a/go/vt/discovery/healthcheck.go b/go/vt/discovery/healthcheck.go index b21cdac44a0..83a4048fe87 100644 --- a/go/vt/discovery/healthcheck.go +++ b/go/vt/discovery/healthcheck.go @@ -45,8 +45,6 @@ import ( "sync" "time" - "github.com/golang/protobuf/proto" - "vitess.io/vitess/go/flagutil" "vitess.io/vitess/go/stats" "vitess.io/vitess/go/vt/log" @@ -711,12 +709,6 @@ func (hc *HealthCheckImpl) TabletConnection(alias *topodata.TabletAlias, target //TODO: test that throws this error return nil, vterrors.Errorf(vtrpc.Code_NOT_FOUND, "tablet: %v is either down or nonexistent", alias) } - if !thc.Serving { - return nil, vterrors.Errorf(vtrpc.Code_FAILED_PRECONDITION, vterrors.NotServing) - } - if target != nil && !proto.Equal(thc.Target, target) { - return nil, vterrors.Errorf(vtrpc.Code_FAILED_PRECONDITION, "%s: target mismatch %v vs %v", vterrors.WrongTablet, thc.Target, target) - } return thc.Connection(), nil } diff --git a/go/vt/vtgate/legacy_scatter_conn_test.go b/go/vt/vtgate/legacy_scatter_conn_test.go index fa18f27bd17..4c48cd2bf04 100644 --- a/go/vt/vtgate/legacy_scatter_conn_test.go +++ b/go/vt/vtgate/legacy_scatter_conn_test.go @@ -17,28 +17,26 @@ limitations under the License. package vtgate import ( + "context" "fmt" "reflect" "strings" "testing" - "vitess.io/vitess/go/test/utils" - "github.com/stretchr/testify/assert" - - "context" - "github.com/stretchr/testify/require" "vitess.io/vitess/go/sqltypes" + "vitess.io/vitess/go/test/utils" "vitess.io/vitess/go/vt/discovery" "vitess.io/vitess/go/vt/key" + "vitess.io/vitess/go/vt/srvtopo" + "vitess.io/vitess/go/vt/vterrors" + querypb "vitess.io/vitess/go/vt/proto/query" topodatapb "vitess.io/vitess/go/vt/proto/topodata" vtgatepb "vitess.io/vitess/go/vt/proto/vtgate" vtrpcpb "vitess.io/vitess/go/vt/proto/vtrpc" - "vitess.io/vitess/go/vt/srvtopo" - "vitess.io/vitess/go/vt/vterrors" ) // This file uses the sandbox_test framework. @@ -387,15 +385,17 @@ func TestMultiExecs(t *testing.T) { rss := []*srvtopo.ResolvedShard{ { Target: &querypb.Target{ - Keyspace: "TestMultiExecs", - Shard: "0", + Keyspace: "TestMultiExecs", + Shard: "0", + TabletType: topodatapb.TabletType_REPLICA, }, Gateway: sbc0, }, { Target: &querypb.Target{ - Keyspace: "TestMultiExecs", - Shard: "1", + Keyspace: "TestMultiExecs", + Shard: "1", + TabletType: topodatapb.TabletType_REPLICA, }, Gateway: sbc1, }, @@ -415,7 +415,8 @@ func TestMultiExecs(t *testing.T) { }, } - _, _ = sc.ExecuteMultiShard(ctx, rss, queries, NewSafeSession(nil), false, false) + _, err := sc.ExecuteMultiShard(ctx, rss, queries, NewSafeSession(nil), false, false) + require.NoError(t, vterrors.Aggregate(err)) if len(sbc0.Queries) == 0 || len(sbc1.Queries) == 0 { t.Fatalf("didn't get expected query") } diff --git a/go/vt/vtgate/scatter_conn.go b/go/vt/vtgate/scatter_conn.go index ea8e27b26c9..1e4b0600241 100644 --- a/go/vt/vtgate/scatter_conn.go +++ b/go/vt/vtgate/scatter_conn.go @@ -221,23 +221,7 @@ func (stc *ScatterConn) ExecuteMultiShard( qs, err = getQueryService(rs, info) if err != nil { - // an error here could mean that the tablet we were targeting earlier has changed type. - // if we have a transaction, we'll have to fail, but if we only had a reserved connection, - // we can create a new reserved connection to a new tablet that is on the right shard - // and has the right type - switch info.actionNeeded { - case nothing: - info.actionNeeded = reserve - case begin: - info.actionNeeded = reserveBegin - default: - return nil, err - } - retry := checkAndResetShardSession(info, err, session) - if retry != newQS { - return nil, err - } - qs = rs.Gateway + return nil, err } retryRequest := func(exec func()) { diff --git a/go/vt/vtgate/scatter_conn_test.go b/go/vt/vtgate/scatter_conn_test.go index 4a5a8dcd8d5..ff1c4af62bc 100644 --- a/go/vt/vtgate/scatter_conn_test.go +++ b/go/vt/vtgate/scatter_conn_test.go @@ -351,12 +351,15 @@ func TestReservedConnFail(t *testing.T) { }) sbc0Th := ths[0] sbc0Th.Serving = false + sbc0.NotServing = true sbc0Rep := hc.AddTestTablet("aa", "0", 2, keyspace, "0", topodatapb.TabletType_REPLICA, true, 1, nil) sbc0.Queries = nil + sbc0.ExecCount.Set(0) _ = executeOnShardsReturnsErr(t, res, keyspace, sc, session, destinations) - assert.Equal(t, 0, len(sbc0.Queries), "no attempt should be made as the tablet is not serving") - assert.Equal(t, 1, len(sbc0Rep.Queries), "first attempt should pass as it is healthy") + assert.EqualValues(t, 1, sbc0.ExecCount.Get(), "first attempt should be made on original tablet") + assert.EqualValues(t, 0, len(sbc0.Queries), "no query should be executed on it") + assert.Equal(t, 1, len(sbc0Rep.Queries), "this attempt on new healthy tablet should pass") require.Equal(t, 1, len(session.ShardSessions)) assert.NotEqual(t, oldRId, session.Session.ShardSessions[0].ReservedId, "should have recreated a reserved connection since the last connection was lost") assert.NotEqual(t, oldAlias, session.Session.ShardSessions[0].TabletAlias, "tablet alias should have changed as this is a different tablet") @@ -376,12 +379,17 @@ func TestReservedConnFail(t *testing.T) { Shard: tablet0Rep.GetShard(), TabletType: topodatapb.TabletType_SPARE, } + sbc0Rep.Tablet().Type = topodatapb.TabletType_SPARE sbc0Th.Serving = true + sbc0.NotServing = false + sbc0.ExecCount.Set(0) sbc0Rep.Queries = nil + sbc0Rep.ExecCount.Set(0) _ = executeOnShardsReturnsErr(t, res, keyspace, sc, session, destinations) - assert.Equal(t, 1, len(sbc0.Queries), "first attempt should pass as it is healthy and matches the target") - assert.Equal(t, 0, len(sbc0Rep.Queries), " no attempt should be made as the tablet target is changed") + assert.EqualValues(t, 1, sbc0Rep.ExecCount.Get(), "first attempt should be made on the changed tablet type") + assert.EqualValues(t, 0, len(sbc0Rep.Queries), "no query should be executed on it") + assert.Equal(t, 1, len(sbc0.Queries), "this attempt should pass as it is on new healthy tablet and matches the target") require.Equal(t, 1, len(session.ShardSessions)) assert.NotEqual(t, oldRId, session.Session.ShardSessions[0].ReservedId, "should have recreated a reserved connection since the last connection was lost") assert.NotEqual(t, oldAlias, session.Session.ShardSessions[0].TabletAlias, "tablet alias should have changed as this is a different tablet") diff --git a/go/vt/vttablet/sandboxconn/sandboxconn.go b/go/vt/vttablet/sandboxconn/sandboxconn.go index 3fff1352aec..c0c7d740e27 100644 --- a/go/vt/vttablet/sandboxconn/sandboxconn.go +++ b/go/vt/vttablet/sandboxconn/sandboxconn.go @@ -114,6 +114,8 @@ type SandboxConn struct { // this error will only happen once EphemeralShardErr error + + NotServing bool } var _ queryservice.QueryService = (*SandboxConn)(nil) // compile-time interface check @@ -153,6 +155,12 @@ func (sbc *SandboxConn) Execute(ctx context.Context, target *querypb.Target, que sbc.execMu.Lock() defer sbc.execMu.Unlock() sbc.ExecCount.Add(1) + if sbc.NotServing { + return nil, vterrors.New(vtrpcpb.Code_FAILED_PRECONDITION, vterrors.NotServing) + } + if sbc.tablet.Type != target.TabletType { + return nil, vterrors.Errorf(vtrpcpb.Code_FAILED_PRECONDITION, "%s: %v, want: %v", vterrors.WrongTablet, target.TabletType, sbc.tablet.Type) + } bv := make(map[string]*querypb.BindVariable) for k, v := range bindVars { bv[k] = v @@ -557,6 +565,11 @@ func (sbc *SandboxConn) Tablet() *topodatapb.Tablet { return sbc.tablet } +// ChangeTabletType changes the tablet type. +func (sbc *SandboxConn) ChangeTabletType(typ topodatapb.TabletType) { + sbc.tablet.Type = typ +} + func (sbc *SandboxConn) getNextResult(stmt sqlparser.Statement) *sqltypes.Result { if len(sbc.results) != 0 { r := sbc.results[0] @@ -596,10 +609,6 @@ func (sbc *SandboxConn) setTxReservedID(transactionID int64, reservedID int64) { sbc.txIDToRID[transactionID] = reservedID } -func (sbc *SandboxConn) ResultsAllFetched() bool { - return len(sbc.results) == 0 -} - func (sbc *SandboxConn) getTxReservedID(txID int64) int64 { sbc.mapMu.Lock() defer sbc.mapMu.Unlock()