*: Check mutations for single-row changes (#27920)

* feat: check index key in AddRecord Signed-off-by: ekexium <ekexium@gmail.com> * feat: check for AddRecord/UpdateRecord Signed-off-by: ekexium <ekexium@gmail.com> * ignore deletion of indices if NeedRestoredData Signed-off-by: ekexium <ekexium@gmail.com> * check values of row mutations Signed-off-by: ekexium <ekexium@gmail.com> * style: fix naming Signed-off-by: ekexium <ekexium@gmail.com> * skip when sh == 0 Signed-off-by: ekexium <ekexium@gmail.com> * check in RemoveRecord Signed-off-by: ekexium <ekexium@gmail.com> * modify license header Signed-off-by: ekexium <ekexium@gmail.com> * test: add unit tests Signed-off-by: ekexium <ekexium@gmail.com> * add lisence header Signed-off-by: ekexium <ekexium@gmail.com> * also truncate decoded mutation Signed-off-by: ekexium <ekexium@gmail.com> * tidy up Signed-off-by: ekexium <ekexium@gmail.com> * refactor according to comments Signed-off-by: ekexium <ekexium@gmail.com> Auto stash before rebase of "ft-data-inconsistency" * skip partitioned table Signed-off-by: ekexium <ekexium@gmail.com> * save columnMap in stmtctx * skip when sh == 0 Some implementations of MemBuffer doesn't support staging. We don't care about them for now * reuse a slice in a loop * save reusable maps in stmtctx * save reusable maps in txn option * add unit test for checkIndexKeys * address comments in test
pingcap · Sep 22, 2021 · 2bece44 · 2bece44
1 parent 32c8c9e
commit 2bece44
Show file tree

Hide file tree

Showing 6 changed files with 646 additions and 5 deletions.
diff --git a/kv/option.go b/kv/option.go
@@ -70,6 +70,9 @@ const (
 	//		2. Ranges of Retrievers do not intersect each other.
 	//		3. Retrievers are sorted by range.
 	SortedCustomRetrievers
+	// TableToColumnMaps is a map from tableID to a series of maps. The maps are needed when checking data consistency.
+	// Save them here to reduce redundant computations.
+	TableToColumnMaps
 )
 
 // ReplicaReadType is the type of replica to read data from

diff --git a/sessionctx/variable/session.go b/sessionctx/variable/session.go
@@ -947,7 +947,7 @@ type SessionVars struct {
 	// MPPStoreFailTTL indicates the duration that protect TiDB from sending task to a new recovered TiFlash.
 	MPPStoreFailTTL string
 
-	// cached is used to optimze the object allocation.
+	// cached is used to optimize the object allocation.
 	cached struct {
 		curr int8
 		data [2]stmtctx.StatementContext

diff --git a/table/tables/mutation_checker.go b/table/tables/mutation_checker.go
@@ -0,0 +1,314 @@
+// Copyright 2021 PingCAP, Inc.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package tables
+
+import (
+	"fmt"
+
+	"github.com/pingcap/errors"
+	"github.com/pingcap/parser/model"
+	"github.com/pingcap/tidb/kv"
+	"github.com/pingcap/tidb/sessionctx/stmtctx"
+	"github.com/pingcap/tidb/sessionctx/variable"
+	"github.com/pingcap/tidb/table"
+	"github.com/pingcap/tidb/tablecodec"
+	"github.com/pingcap/tidb/types"
+	"github.com/pingcap/tidb/util/logutil"
+	"github.com/pingcap/tidb/util/rowcodec"
+	"go.uber.org/zap"
+)
+
+type mutation struct {
+	key   kv.Key
+	flags kv.KeyFlags
+	value []byte
+}
+
+type columnMaps struct {
+	ColumnIDToInfo       map[int64]*model.ColumnInfo
+	ColumnIDToFieldType  map[int64]*types.FieldType
+	IndexIDToInfo        map[int64]*model.IndexInfo
+	IndexIDToRowColInfos map[int64][]rowcodec.ColInfo
+}
+
+// CheckIndexConsistency checks whether the given set of mutations corresponding to a single row is consistent.
+// Namely, assume the database is consistent before, applying the mutations shouldn't break the consistency.
+// It aims at reducing bugs that will corrupt data, and preventing mistakes from spreading if possible.
+//
+// The check doesn't work and just returns nil when:
+// (1) the table is partitioned
+// (2) new collation is enabled and restored data is needed
+//
+// How it works:
+//
+// Assume the set of row values changes from V1 to V2, we check
+// (1) V2 - V1 = {added indices}
+// (2) V1 - V2 = {deleted indices}
+//
+// To check (1), we need
+// (a) {added indices} is a subset of {needed indices} => each index mutation is consistent with the input/row key/value
+// (b) {needed indices} is a subset of {added indices}. The check process would be exactly the same with how we generate
+// 		the mutations, thus ignored.
+func CheckIndexConsistency(
+	txn kv.Transaction, sessVars *variable.SessionVars, t *TableCommon,
+	rowToInsert, rowToRemove []types.Datum, memBuffer kv.MemBuffer, sh kv.StagingHandle,
+) error {
+	if t.Meta().GetPartitionInfo() != nil {
+		return nil
+	}
+	if sh == 0 {
+		// some implementations of MemBuffer doesn't support staging, e.g. that in br/pkg/lightning/backend/kv
+		return nil
+	}
+	indexMutations, rowInsertion, err := collectTableMutationsFromBufferStage(t, memBuffer, sh)
+	if err != nil {
+		return errors.Trace(err)
+	}
+
+	columnMaps := getColumnMaps(txn, t)
+
+	if rowToInsert != nil {
+		if err := checkRowInsertionConsistency(
+			sessVars, rowToInsert, rowInsertion, columnMaps.ColumnIDToInfo, columnMaps.ColumnIDToFieldType,
+		); err != nil {
+			return errors.Trace(err)
+		}
+	}
+	if err := checkIndexKeys(
+		sessVars, t, rowToInsert, rowToRemove, indexMutations, columnMaps.IndexIDToInfo, columnMaps.IndexIDToRowColInfos,
+	); err != nil {
+		return errors.Trace(err)
+	}
+	return nil
+}
+
+// checkIndexKeys checks whether the decoded data from keys of index mutations are consistent with the expected ones.
+func checkIndexKeys(
+	sessVars *variable.SessionVars, t *TableCommon, rowToInsert, rowToRemove []types.Datum,
+	indexMutations []mutation, indexIDToInfo map[int64]*model.IndexInfo,
+	indexIDToRowColInfos map[int64][]rowcodec.ColInfo,
+) error {
+
+	var indexData []types.Datum
+	for _, m := range indexMutations {
+		_, indexID, _, err := tablecodec.DecodeIndexKey(m.key)
+		if err != nil {
+			return errors.Trace(err)
+		}
+
+		indexInfo, ok := indexIDToInfo[indexID]
+		if !ok {
+			return errors.New("index not found")
+		}
+		rowColInfos, ok := indexIDToRowColInfos[indexID]
+		if !ok {
+			return errors.New("index not found")
+		}
+
+		// when we cannot decode the key to get the original value
+		if len(m.value) == 0 && NeedRestoredData(indexInfo.Columns, t.Meta().Columns) {
+			continue
+		}
+
+		decodedIndexValues, err := tablecodec.DecodeIndexKV(
+			m.key, m.value, len(indexInfo.Columns), tablecodec.HandleNotNeeded, rowColInfos,
+		)
+		if err != nil {
+			return errors.Trace(err)
+		}
+
+		// reuse the underlying memory, save an allocation
+		if indexData == nil {
+			indexData = make([]types.Datum, 0, len(decodedIndexValues))
+		} else {
+			indexData = indexData[:0]
+		}
+
+		for i, v := range decodedIndexValues {
+			fieldType := &t.Columns[indexInfo.Columns[i].Offset].FieldType
+			datum, err := tablecodec.DecodeColumnValue(v, fieldType, sessVars.Location())
+			if err != nil {
+				return errors.Trace(err)
+			}
+			indexData = append(indexData, datum)
+		}
+
+		if len(m.value) == 0 {
+			err = compareIndexData(sessVars.StmtCtx, t.Columns, indexData, rowToRemove, indexInfo)
+		} else {
+			err = compareIndexData(sessVars.StmtCtx, t.Columns, indexData, rowToInsert, indexInfo)
+		}
+		if err != nil {
+			return errors.Trace(err)
+		}
+	}
+	return nil
+}
+
+// checkRowInsertionConsistency checks whether the values of row mutations are consistent with the expected ones
+// We only check data added since a deletion of a row doesn't care about its value (and we cannot know it)
+func checkRowInsertionConsistency(
+	sessVars *variable.SessionVars, rowToInsert []types.Datum, rowInsertion mutation,
+	columnIDToInfo map[int64]*model.ColumnInfo, columnIDToFieldType map[int64]*types.FieldType,
+) error {
+	if rowToInsert == nil {
+		// it's a deletion
+		return nil
+	}
+
+	decodedData, err := tablecodec.DecodeRowToDatumMap(rowInsertion.value, columnIDToFieldType, sessVars.Location())
+	if err != nil {
+		return errors.Trace(err)
+	}
+
+	// NOTE: we cannot check if the decoded values contain all columns since some columns may be skipped. It can even be empty
+	// Instead, we check that decoded index values are consistent with the input row.
+
+	for columnID, decodedDatum := range decodedData {
+		inputDatum := rowToInsert[columnIDToInfo[columnID].Offset]
+		cmp, err := decodedDatum.CompareDatum(sessVars.StmtCtx, &inputDatum)
+		if err != nil {
+			return errors.Trace(err)
+		}
+		if cmp != 0 {
+			logutil.BgLogger().Error(
+				"inconsistent row mutation", zap.String("decoded datum", decodedDatum.String()),
+				zap.String("input datum", inputDatum.String()),
+			)
+			return errors.Errorf(
+				"inconsistent row mutation, row datum = {%v}, input datum = {%v}", decodedDatum.String(),
+				inputDatum.String(),
+			)
+		}
+	}
+	return nil
+}
+
+// collectTableMutationsFromBufferStage collects mutations of the current table from the mem buffer stage
+// It returns: (1) all index mutations (2) the only row insertion
+// If there are no row insertions, the 2nd returned value is nil
+// If there are multiple row insertions, an error is returned
+func collectTableMutationsFromBufferStage(t *TableCommon, memBuffer kv.MemBuffer, sh kv.StagingHandle) (
+	[]mutation, mutation, error,
+) {
+	indexMutations := make([]mutation, 0)
+	var rowInsertion mutation
+	var err error
+	inspector := func(key kv.Key, flags kv.KeyFlags, data []byte) {
+		// only check the current table
+		if tablecodec.DecodeTableID(key) == t.physicalTableID {
+			m := mutation{key, flags, data}
+			if rowcodec.IsRowKey(key) {
+				if len(data) > 0 {
+					if rowInsertion.key == nil {
+						rowInsertion = m
+					} else {
+						err = errors.Errorf(
+							"multiple row mutations added/mutated, one = %+v, another = %+v", rowInsertion, m,
+						)
+					}
+				}
+			} else {
+				indexMutations = append(indexMutations, m)
+			}
+		}
+	}
+	memBuffer.InspectStage(sh, inspector)
+	return indexMutations, rowInsertion, err
+}
+
+// compareIndexData compares the decoded index data with the input data.
+// Returns error if the index data is not a subset of the input data.
+func compareIndexData(
+	sc *stmtctx.StatementContext, cols []*table.Column, indexData, input []types.Datum, indexInfo *model.IndexInfo,
+) error {
+	for i, decodedMutationDatum := range indexData {
+		expectedDatum := input[indexInfo.Columns[i].Offset]
+
+		tablecodec.TruncateIndexValue(
+			&expectedDatum, indexInfo.Columns[i],
+			cols[indexInfo.Columns[i].Offset].ColumnInfo,
+		)
+		tablecodec.TruncateIndexValue(
+			&decodedMutationDatum, indexInfo.Columns[i],
+			cols[indexInfo.Columns[i].Offset].ColumnInfo,
+		)
+
+		comparison, err := decodedMutationDatum.CompareDatum(sc, &expectedDatum)
+		if err != nil {
+			return errors.Trace(err)
+		}
+
+		if comparison != 0 {
+			logutil.BgLogger().Error(
+				"inconsistent index values",
+				zap.String("truncated mutation datum", fmt.Sprintf("%v", decodedMutationDatum)),
+				zap.String("truncated expected datum", fmt.Sprintf("%v", expectedDatum)),
+			)
+			return errors.New("inconsistent index values")
+		}
+	}
+	return nil
+}
+
+// getColumnMaps tries to get the columnMaps from transaction options. If there isn't one, it builds one and stores it.
+// It saves redundant computations of the map.
+func getColumnMaps(txn kv.Transaction, t *TableCommon) columnMaps {
+	getter := func() (map[int64]columnMaps, bool) {
+		m, ok := txn.GetOption(kv.TableToColumnMaps).(map[int64]columnMaps)
+		return m, ok
+	}
+	setter := func(maps map[int64]columnMaps) {
+		txn.SetOption(kv.TableToColumnMaps, maps)
+	}
+	columnMaps := getOrBuildColumnMaps(getter, setter, t)
+	return columnMaps
+}
+
+// getOrBuildColumnMaps tries to get the columnMaps from some place. If there isn't one, it builds one and stores it.
+// It saves redundant computations of the map.
+func getOrBuildColumnMaps(
+	getter func() (map[int64]columnMaps, bool), setter func(map[int64]columnMaps), t *TableCommon,
+) columnMaps {
+	tableMaps, ok := getter()
+	if !ok || tableMaps == nil {
+		tableMaps = make(map[int64]columnMaps)
+	}
+	maps, ok := tableMaps[t.tableID]
+	if !ok {
+		maps = columnMaps{
+			make(map[int64]*model.ColumnInfo, len(t.Meta().Columns)),
+			make(map[int64]*types.FieldType, len(t.Meta().Columns)),
+			make(map[int64]*model.IndexInfo, len(t.Indices())),
+			make(map[int64][]rowcodec.ColInfo, len(t.Indices())),
+		}
+
+		for _, col := range t.Meta().Columns {
+			maps.ColumnIDToInfo[col.ID] = col
+			maps.ColumnIDToFieldType[col.ID] = &col.FieldType
+		}
+		for _, index := range t.Indices() {
+			if index.Meta().Primary && t.meta.IsCommonHandle {
+				continue
+			}
+			maps.IndexIDToInfo[index.Meta().ID] = index.Meta()
+			maps.IndexIDToRowColInfos[index.Meta().ID] = BuildRowcodecColInfoForIndexColumns(index.Meta(), t.Meta())
+		}
+
+		tableMaps[t.tableID] = maps
+		setter(tableMaps)
+	}
+	return maps
+}