Skip to content

Commit

Permalink
copIterator: return context error to avoid return incorrect result on…
Browse files Browse the repository at this point in the history
… context cancel/timeout (#53489) (#55638)

close #50089
  • Loading branch information
ti-chi-bot authored Sep 14, 2024
1 parent 9b45610 commit 271edfd
Show file tree
Hide file tree
Showing 4 changed files with 105 additions and 39 deletions.
4 changes: 3 additions & 1 deletion pkg/ddl/backfilling_operators.go
Original file line number Diff line number Diff line change
Expand Up @@ -728,7 +728,9 @@ func (w *indexIngestBaseWorker) WriteChunk(rs *IndexRecordChunk) (count int, nex
failpoint.Return(0, nil, errors.New("mock write local error"))
})
failpoint.Inject("writeLocalExec", func(_ failpoint.Value) {
OperatorCallBackForTest()
if rs.Done {
OperatorCallBackForTest()
}
})

oprStartTime := time.Now()
Expand Down
36 changes: 36 additions & 0 deletions pkg/executor/adapter_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -15,13 +15,19 @@
package executor_test

import (
"context"
"sync"
"testing"
"time"

"github.com/pingcap/failpoint"
"github.com/pingcap/tidb/pkg/executor"
"github.com/pingcap/tidb/pkg/session"
"github.com/pingcap/tidb/pkg/sessionctx/variable"
"github.com/pingcap/tidb/pkg/store/copr"
"github.com/pingcap/tidb/pkg/testkit"
"github.com/stretchr/testify/require"
"github.com/tikv/client-go/v2/util"
)

func TestQueryTime(t *testing.T) {
Expand Down Expand Up @@ -52,3 +58,33 @@ func TestFormatSQL(t *testing.T) {
val = executor.FormatSQL("aaaaaaaaaaaaaaaaaaaa")
require.Equal(t, "aaaaa(len:20)", val.String())
}

// TestContextCancelWhenReadFromCopIterator verifies that reading a result set
// whose context is cancelled while the coprocessor iterator is about to receive
// a response surfaces context.Canceled instead of silently returning an
// empty/partial result.
//
// The CtxCancelBeforeReceive failpoint makes the iterator pause and hand-shake
// with this test over copr.GlobalSyncChForTest, which gives the test a
// deterministic point at which to cancel the context.
func TestContextCancelWhenReadFromCopIterator(t *testing.T) {
	store := testkit.CreateMockStore(t)
	tk := testkit.NewTestKit(t, store)
	tk.MustExec("use test")
	tk.MustExec("create table t(a int)")
	tk.MustExec("insert into t values(1)")

	require.NoError(t, failpoint.Enable("github.com/pingcap/tidb/pkg/store/copr/CtxCancelBeforeReceive", "return(true)"))
	defer func() {
		require.NoError(t, failpoint.Disable("github.com/pingcap/tidb/pkg/store/copr/CtxCancelBeforeReceive"))
	}()
	// The plain string key/value pair must stay exactly as is: the failpoint
	// body looks it up with ctx.Value("TestContextCancel") == "test".
	ctx := context.WithValue(context.Background(), "TestContextCancel", "test")
	ctx, cancelFunc := context.WithCancel(ctx)
	defer cancelFunc()

	// Errors are recorded by the worker goroutine and asserted on the test
	// goroutine after wg.Wait(): require.* ends up in t.FailNow, which must
	// only be called from the goroutine running the test function.
	var (
		wg      sync.WaitGroup
		execErr error
		readErr error
	)
	wg.Add(1)
	go func() {
		defer wg.Done()
		// Use a local derived context instead of reassigning the captured one.
		queryCtx := util.WithInternalSourceType(ctx, "scheduler")
		rs, err := tk.Session().ExecuteInternal(queryCtx, "select * from test.t")
		if err != nil {
			execErr = err
			return
		}
		_, readErr = session.ResultSetToStringSlice(queryCtx, tk.Session(), rs)
	}()

	// Wait until the iterator reaches the failpoint, cancel the context, then
	// let the iterator continue.
	<-copr.GlobalSyncChForTest
	cancelFunc()
	copr.GlobalSyncChForTest <- struct{}{}
	wg.Wait()

	require.NoError(t, execErr)
	require.ErrorIs(t, readErr, context.Canceled)
}
15 changes: 12 additions & 3 deletions pkg/store/copr/coprocessor.go
Original file line number Diff line number Diff line change
Expand Up @@ -915,7 +915,16 @@ func (sender *copIteratorTaskSender) run(connID uint64) {
}
}

// GlobalSyncChForTest is a global, unbuffered channel used only by tests.
// When the CtxCancelBeforeReceive failpoint is enabled and the context carries
// the "TestContextCancel" = "test" value, copIterator.recvFromRespCh sends on
// this channel and then blocks receiving from it, so a test can act (for
// example, cancel the context) at exactly that point before letting the
// iterator continue.
var GlobalSyncChForTest = make(chan struct{})

func (it *copIterator) recvFromRespCh(ctx context.Context, respCh <-chan *copResponse) (resp *copResponse, ok bool, exit bool) {
failpoint.Inject("CtxCancelBeforeReceive", func(_ failpoint.Value) {
if ctx.Value("TestContextCancel") == "test" {
GlobalSyncChForTest <- struct{}{}
<-GlobalSyncChForTest
}
})
ticker := time.NewTicker(3 * time.Second)
defer ticker.Stop()
for {
Expand Down Expand Up @@ -1052,7 +1061,7 @@ func (it *copIterator) Next(ctx context.Context) (kv.ResultSubset, error) {
resp, ok, closed = it.recvFromRespCh(ctx, it.respChan)
if !ok || closed {
it.actionOnExceed.close()
return nil, nil
return nil, errors.Trace(ctx.Err())
}
if resp == finCopResp {
it.actionOnExceed.destroyTokenIfNeeded(func() {
Expand All @@ -1070,8 +1079,8 @@ func (it *copIterator) Next(ctx context.Context) (kv.ResultSubset, error) {
task := it.tasks[it.curr]
resp, ok, closed = it.recvFromRespCh(ctx, task.respChan)
if closed {
// Close() is already called, so Next() is invalid.
return nil, nil
// Close() is called or context cancelled/timeout, so Next() is invalid.
return nil, errors.Trace(ctx.Err())
}
if ok {
break
Expand Down
89 changes: 54 additions & 35 deletions tests/realtikvtest/addindextest3/operator_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ package addindextest
import (
"context"
"fmt"
"strings"
"sync/atomic"
"testing"

Expand Down Expand Up @@ -231,7 +232,7 @@ func TestBackfillOperatorPipelineException(t *testing.T) {
{
failPointPath: "github.com/pingcap/tidb/pkg/ddl/scanRecordExec",
closeErrMsg: "context canceled",
operatorErrMsg: "",
operatorErrMsg: "context canceled",
},
{
failPointPath: "github.com/pingcap/tidb/pkg/ddl/mockWriteLocalError",
Expand All @@ -251,41 +252,59 @@ func TestBackfillOperatorPipelineException(t *testing.T) {
}

for _, tc := range testCase {
require.NoError(t, failpoint.Enable(tc.failPointPath, `return`))
ctx, cancel := context.WithCancel(context.Background())
ddl.OperatorCallBackForTest = func() {
t.Run(tc.failPointPath, func(t *testing.T) {
require.NoError(t, failpoint.Enable(tc.failPointPath, `return`))
defer func() {
require.NoError(t, failpoint.Disable(tc.failPointPath))
}()
ctx, cancel := context.WithCancel(context.Background())
if strings.Contains(tc.failPointPath, "writeLocalExec") {
var counter atomic.Int32
ddl.OperatorCallBackForTest = func() {
// we need to wait for all tableScanWorkers to finish scanning, otherwise
// fetchTableScanResult might return a context error and cause
// the case to fail.
// 10 is the table scan task count.
counter.Add(1)
if counter.Load() == 10 {
cancel()
}
}
} else {
ddl.OperatorCallBackForTest = func() {
cancel()
}
}
opCtx := ddl.NewOperatorCtx(ctx)
pipeline, err := ddl.NewAddIndexIngestPipeline(
opCtx, store,
sessPool,
mockBackendCtx,
[]ingest.Engine{mockEngine},
tk.Session(),
tbl.(table.PhysicalTable),
[]*model.IndexInfo{idxInfo},
startKey,
endKey,
&atomic.Int64{},
nil,
ddl.NewDDLReorgMeta(tk.Session()),
)
require.NoError(t, err)
err = pipeline.Execute()
require.NoError(t, err)
err = pipeline.Close()
comment := fmt.Sprintf("case: %s", tc.failPointPath)
require.ErrorContains(t, err, tc.closeErrMsg, comment)
opCtx.Cancel()
if tc.operatorErrMsg == "" {
require.NoError(t, opCtx.OperatorErr())
} else {
require.Error(t, opCtx.OperatorErr())
require.Equal(t, tc.operatorErrMsg, opCtx.OperatorErr().Error())
}
cancel()
}
opCtx := ddl.NewOperatorCtx(ctx)
pipeline, err := ddl.NewAddIndexIngestPipeline(
opCtx, store,
sessPool,
mockBackendCtx,
[]ingest.Engine{mockEngine},
tk.Session(),
tbl.(table.PhysicalTable),
[]*model.IndexInfo{idxInfo},
startKey,
endKey,
&atomic.Int64{},
nil,
ddl.NewDDLReorgMeta(tk.Session()),
)
require.NoError(t, err)
err = pipeline.Execute()
require.NoError(t, err)
err = pipeline.Close()
comment := fmt.Sprintf("case: %s", tc.failPointPath)
require.ErrorContains(t, err, tc.closeErrMsg, comment)
opCtx.Cancel()
if tc.operatorErrMsg == "" {
require.NoError(t, opCtx.OperatorErr())
} else {
require.Error(t, opCtx.OperatorErr())
require.Equal(t, tc.operatorErrMsg, opCtx.OperatorErr().Error())
}
require.NoError(t, failpoint.Disable(tc.failPointPath))
cancel()
})
}
}

Expand Down

0 comments on commit 271edfd

Please sign in to comment.