From d4496bd7bd1412ce0b35c41a71788ea91e18dd41 Mon Sep 17 00:00:00 2001
From: lance6716
Date: Wed, 11 Dec 2024 15:20:57 +0800
Subject: [PATCH] This is an automated cherry-pick of #58148

Signed-off-by: ti-chi-bot
---
 pkg/lightning/errormanager/errormanager.go    | 1145 +++++++++++++++++
 .../errormanager/errormanager_test.go         |  724 +++++++++++
 2 files changed, 1869 insertions(+)
 create mode 100644 pkg/lightning/errormanager/errormanager.go
 create mode 100644 pkg/lightning/errormanager/errormanager_test.go

diff --git a/pkg/lightning/errormanager/errormanager.go b/pkg/lightning/errormanager/errormanager.go
new file mode 100644
index 0000000000000..10e68266d77fd
--- /dev/null
+++ b/pkg/lightning/errormanager/errormanager.go
@@ -0,0 +1,1145 @@
+// Copyright 2021 PingCAP, Inc.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package errormanager
+
+import (
+    "bytes"
+    "context"
+    "database/sql"
+    "fmt"
+    "math"
+    "strings"
+    "sync"
+
+    "github.com/jedib0t/go-pretty/v6/table"
+    "github.com/jedib0t/go-pretty/v6/text"
+    "github.com/pingcap/errors"
+    "github.com/pingcap/tidb/br/pkg/logutil"
+    "github.com/pingcap/tidb/pkg/lightning/backend/encode"
+    "github.com/pingcap/tidb/pkg/lightning/backend/kv"
+    "github.com/pingcap/tidb/pkg/lightning/common"
+    "github.com/pingcap/tidb/pkg/lightning/config"
+    "github.com/pingcap/tidb/pkg/lightning/log"
+    "github.com/pingcap/tidb/pkg/parser/mysql"
+    tidbtbl "github.com/pingcap/tidb/pkg/table"
+    "github.com/pingcap/tidb/pkg/table/tables"
+    "github.com/pingcap/tidb/pkg/tablecodec"
+    "github.com/pingcap/tidb/pkg/types"
+    "github.com/pingcap/tidb/pkg/util"
+    "github.com/pingcap/tidb/pkg/util/redact"
+    tikverr "github.com/tikv/client-go/v2/error"
+    "go.uber.org/atomic"
+    "go.uber.org/multierr"
+    "go.uber.org/zap"
+    "golang.org/x/exp/slices"
+    "golang.org/x/sync/errgroup"
+)
+
+const (
+    createSchema = `
+        CREATE SCHEMA IF NOT EXISTS %s;
+    `
+
+    syntaxErrorTableName = "syntax_error_v2"
+    typeErrorTableName   = "type_error_v2"
+    // ConflictErrorTableName is the table name for duplicate detection.
+    ConflictErrorTableName = "conflict_error_v4"
+    // DupRecordTableName is the table name to record duplicate data that is
+    // displayed to the user.
+    DupRecordTableName = "conflict_records_v2"
+    // ConflictViewName is the view name for presenting the union information of ConflictErrorTable and DupRecordTable.
+    ConflictViewName = "conflict_view"
+
+    createSyntaxErrorTable = `
+        CREATE TABLE IF NOT EXISTS %s.` + syntaxErrorTableName + ` (
+            id          bigint PRIMARY KEY AUTO_INCREMENT,
+            task_id     bigint NOT NULL,
+            create_time datetime(6) NOT NULL DEFAULT now(6),
+            table_name  varchar(261) NOT NULL,
+            path        varchar(2048) NOT NULL,
+            offset      bigint NOT NULL,
+            error       text NOT NULL,
+            context     text
+        );
+    `
+
+    createTypeErrorTable = `
+        CREATE TABLE IF NOT EXISTS %s.` + typeErrorTableName + ` (
+            id          bigint PRIMARY KEY AUTO_INCREMENT,
+            task_id     bigint NOT NULL,
+            create_time datetime(6) NOT NULL DEFAULT now(6),
+            table_name  varchar(261) NOT NULL,
+            path        varchar(2048) NOT NULL,
+            offset      bigint NOT NULL,
+            error       text NOT NULL,
+            row_data    text NOT NULL
+        );
+    `
+
+    createConflictErrorTable = `
+        CREATE TABLE IF NOT EXISTS %s.` + ConflictErrorTableName + ` (
+            id          bigint PRIMARY KEY AUTO_INCREMENT,
+            task_id     bigint NOT NULL,
+            create_time datetime(6) NOT NULL DEFAULT now(6),
+            table_name  varchar(261) NOT NULL,
+            index_name  varchar(128) NOT NULL,
+            key_data    text COMMENT 'decoded from raw_key, human readable only, not for machine use',
+            row_data    text COMMENT 'decoded from raw_row, human readable only, not for machine use',
+            raw_key     mediumblob NOT NULL COMMENT 'the conflicted key',
+            raw_value   mediumblob NOT NULL COMMENT 'the value of the conflicted key',
+            raw_handle  mediumblob NOT NULL COMMENT 'the data handle derived from the conflicted key or value',
+            raw_row     mediumblob NOT NULL COMMENT 'the data retrieved from the handle',
+            kv_type     tinyint(1) NOT NULL COMMENT '0 for index kv, 1 for data kv, 2 for additionally inserted data kv',
+            INDEX (task_id, table_name),
+            INDEX (index_name),
+            INDEX (table_name, index_name),
+            INDEX (kv_type)
+        );
+    `
+
+    createDupRecordTableName = `
+        CREATE TABLE IF NOT EXISTS %s.` + DupRecordTableName + ` (
+            id          bigint PRIMARY KEY AUTO_INCREMENT,
+            task_id     bigint NOT NULL,
+            create_time datetime(6) NOT NULL DEFAULT now(6),
+            table_name  varchar(261) NOT NULL,
+            path        varchar(2048) NOT NULL,
+            offset      bigint NOT NULL,
+            error       text NOT NULL,
+            row_id      bigint NOT NULL COMMENT 'the row id of the conflicted row',
+            row_data    text NOT NULL COMMENT 'the row data of the conflicted row',
+            KEY (task_id, table_name)
+        );
+    `
+
+    createConflictV1View = `
+        CREATE OR REPLACE VIEW %s.` + ConflictViewName + `
+        AS SELECT 0 AS is_precheck_conflict, task_id, create_time, table_name, index_name, key_data, row_data,
+        raw_key, raw_value, raw_handle, raw_row, kv_type, NULL AS path, NULL AS offset, NULL AS error, NULL AS row_id
+        FROM %s.` + ConflictErrorTableName + `;
+    `
+
+    createConflictV2View = `
+        CREATE OR REPLACE VIEW %s.` + ConflictViewName + `
+        AS SELECT 1 AS is_precheck_conflict, task_id, create_time, table_name, NULL AS index_name, NULL AS key_data,
+        row_data, NULL AS raw_key, NULL AS raw_value, NULL AS raw_handle, NULL AS raw_row, NULL AS kv_type, path,
+        offset, error, row_id FROM %s.` + DupRecordTableName + `;
+    `
+
+    createConflictV1V2View = `
+        CREATE OR REPLACE VIEW %s.` + ConflictViewName + `
+        AS SELECT 0 AS is_precheck_conflict, task_id, create_time, table_name, index_name, key_data, row_data,
+        raw_key, raw_value, raw_handle, raw_row, kv_type, NULL AS path, NULL AS offset, NULL AS error, NULL AS row_id
+        FROM %s.` + ConflictErrorTableName + `
+        UNION ALL SELECT 1 AS is_precheck_conflict, task_id, create_time, table_name, NULL AS index_name, NULL AS key_data,
+        row_data, NULL AS raw_key, NULL AS raw_value, NULL AS raw_handle, NULL AS raw_row, NULL AS kv_type, path,
+        offset, error, row_id FROM %s.` + DupRecordTableName + `;
+    `
+
+    insertIntoTypeError = `
+        INSERT INTO %s.` + typeErrorTableName + `
+        (task_id, table_name, path, offset, error, row_data)
+        VALUES (?, ?, ?, ?, ?, ?);
+    `
+
+    insertIntoConflictErrorData = `
+        INSERT INTO %s.` + ConflictErrorTableName + `
+        (task_id, table_name, index_name, key_data, row_data, raw_key, raw_value, raw_handle, raw_row, kv_type)
+        VALUES
+    `
+
+    sqlValuesConflictErrorData = "(?,?,'PRIMARY',?,?,?,?,raw_key,raw_value,?)"
+
+    insertIntoConflictErrorIndex = `
+        INSERT INTO %s.` + ConflictErrorTableName + `
+        (task_id, table_name, index_name, key_data, row_data, raw_key, raw_value, raw_handle, raw_row, kv_type)
+        VALUES
+    `
+
+    sqlValuesConflictErrorIndex = "(?,?,?,?,?,?,?,?,?,?)"
+
+    selectIndexConflictKeysReplace = `
+        SELECT id, raw_key, index_name, raw_value, raw_handle
+        FROM %s.` + ConflictErrorTableName + `
+        WHERE table_name = ? AND kv_type = 0 AND id >= ? and id < ?
+        ORDER BY id LIMIT ?;
+    `
+
+    selectDataConflictKeysReplace = `
+        SELECT id, raw_key, raw_value
+        FROM %s.` + ConflictErrorTableName + `
+        WHERE table_name = ? AND kv_type <> 0 AND id >= ? and id < ?
+        ORDER BY id LIMIT ?;
+    `
+
+    deleteNullDataRow = `
+        DELETE FROM %s.` + ConflictErrorTableName + `
+        WHERE kv_type = 2
+        LIMIT ?;
+    `
+
+    insertIntoDupRecord = `
+        INSERT INTO %s.` + DupRecordTableName + `
+        (task_id, table_name, path, offset, error, row_id, row_data)
+        VALUES (?, ?, ?, ?, ?, ?, ?);
+    `
+)
+
+// ErrorManager records errors during the import process.
+type ErrorManager struct {
+    db             *sql.DB
+    taskID         int64
+    schema         string
+    configError    *config.MaxError
+    remainingError config.MaxError
+
+    configConflict        *config.Conflict
+    conflictErrRemain     *atomic.Int64
+    conflictRecordsRemain *atomic.Int64
+    conflictV1Enabled     bool
+    conflictV2Enabled     bool
+    logger                log.Logger
+    recordErrorOnce       *atomic.Bool
+}
+
+// TypeErrorsRemain returns the number of type errors that can be recorded.
+func (em *ErrorManager) TypeErrorsRemain() int64 {
+    return em.remainingError.Type.Load()
+}
+
+// ConflictErrorsRemain returns the number of conflict errors that can be recorded.
+func (em *ErrorManager) ConflictErrorsRemain() int64 {
+    return em.conflictErrRemain.Load()
+}
+
+// ConflictRecordsRemain returns the number of conflict records that can still
+// be recorded.
+func (em *ErrorManager) ConflictRecordsRemain() int64 {
+    return em.conflictRecordsRemain.Load()
+}
+
+// RecordErrorOnce returns whether RecordDuplicateOnce has been called. Note
+// that this method is not atomic with RecordDuplicateOnce.
+func (em *ErrorManager) RecordErrorOnce() bool {
+    return em.recordErrorOnce.Load()
+}
+
+// New creates a new error manager.
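+// Conflict handling takes two paths: conflictV1Enabled covers the local
+// backend's post-import conflict detection, while conflictV2Enabled covers
+// the pre-import check on the local backend as well as the TiDB backend (see
+// the switch below). A typical call sequence is sketched here; the variable
+// names are illustrative only:
+//
+//	em := errormanager.New(db, cfg, log.L())
+//	if err := em.Init(ctx); err != nil { /* handle the error */ }
+//	_ = em.RecordTypeError(ctx, log.L(), tableName, path, offset, rowText, encodeErr)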
+func New(db *sql.DB, cfg *config.Config, logger log.Logger) *ErrorManager {
+    conflictErrRemain := atomic.NewInt64(cfg.Conflict.Threshold)
+    conflictRecordsRemain := atomic.NewInt64(cfg.Conflict.MaxRecordRows)
+    em := &ErrorManager{
+        taskID:                cfg.TaskID,
+        configError:           &cfg.App.MaxError,
+        remainingError:        cfg.App.MaxError,
+        conflictV1Enabled:     cfg.TikvImporter.Backend == config.BackendLocal && cfg.Conflict.Strategy != config.NoneOnDup,
+        configConflict:        &cfg.Conflict,
+        conflictErrRemain:     conflictErrRemain,
+        conflictRecordsRemain: conflictRecordsRemain,
+        logger:                logger,
+        recordErrorOnce:       atomic.NewBool(false),
+    }
+    switch cfg.TikvImporter.Backend {
+    case config.BackendLocal:
+        if cfg.Conflict.PrecheckConflictBeforeImport && cfg.Conflict.Strategy != config.NoneOnDup {
+            em.conflictV2Enabled = true
+        }
+    case config.BackendTiDB:
+        em.conflictV2Enabled = true
+    }
+    if len(cfg.App.TaskInfoSchemaName) != 0 {
+        em.db = db
+        em.schema = cfg.App.TaskInfoSchemaName
+    }
+    return em
+}
+
+// Init creates the schemas and tables to store the task information.
+func (em *ErrorManager) Init(ctx context.Context) error {
+    if em.db == nil {
+        return nil
+    }
+
+    exec := common.SQLWithRetry{
+        DB:     em.db,
+        Logger: em.logger,
+    }
+
+    sqls := make([][2]string, 0)
+    sqls = append(sqls, [2]string{"create task info schema", createSchema})
+    if em.remainingError.Syntax.Load() > 0 {
+        sqls = append(sqls, [2]string{"create syntax error table", createSyntaxErrorTable})
+    }
+    if em.remainingError.Type.Load() > 0 {
+        sqls = append(sqls, [2]string{"create type error table", createTypeErrorTable})
+    }
+    if em.conflictV1Enabled {
+        sqls = append(sqls, [2]string{"create conflict error table", createConflictErrorTable})
+    }
+    if em.conflictV2Enabled {
+        sqls = append(sqls, [2]string{"create duplicate records table", createDupRecordTableName})
+    }
+
+    // No need to create task info schema if no error is allowed.
+    if len(sqls) == 1 {
+        return nil
+    }
+
+    for _, sql := range sqls {
+        // trim spaces for unit test pattern matching
+        err := exec.Exec(ctx, sql[0], strings.TrimSpace(common.SprintfWithIdentifiers(sql[1], em.schema)))
+        if err != nil {
+            return err
+        }
+    }
+
+    if em.conflictV1Enabled && em.conflictV2Enabled {
+        err := exec.Exec(ctx, "create conflict view", strings.TrimSpace(common.SprintfWithIdentifiers(createConflictV1V2View, em.schema, em.schema, em.schema)))
+        if err != nil {
+            return err
+        }
+    } else if em.conflictV1Enabled {
+        err := exec.Exec(ctx, "create conflict view", strings.TrimSpace(common.SprintfWithIdentifiers(createConflictV1View, em.schema, em.schema)))
+        if err != nil {
+            return err
+        }
+    } else if em.conflictV2Enabled {
+        err := exec.Exec(ctx, "create conflict view", strings.TrimSpace(common.SprintfWithIdentifiers(createConflictV2View, em.schema, em.schema)))
+        if err != nil {
+            return err
+        }
+    }
+
+    return nil
+}
+
+// RecordTypeError records a type error.
+// If the number of recorded type errors exceeds the max-error count, also
+// returns `encodeErr` directly.
+func (em *ErrorManager) RecordTypeError(
+    ctx context.Context,
+    logger log.Logger,
+    tableName string,
+    path string,
+    offset int64,
+    rowText string,
+    encodeErr error,
+) error {
+    // elide the encode error if needed.
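+    // remainingError.Type acts as a budget: every type error decrements it,
+    // and once it drops below zero the encode error is returned to the caller
+    // instead of being recorded.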
+    if em.remainingError.Type.Dec() < 0 {
+        threshold := em.configError.Type.Load()
+        if threshold > 0 {
+            encodeErr = errors.Annotatef(encodeErr,
+                "The number of type errors exceeds the threshold configured by `max-error.type`: '%d'",
+                threshold)
+        }
+        return encodeErr
+    }
+
+    if em.db != nil {
+        errMsg := encodeErr.Error()
+        logger = logger.With(
+            zap.Int64("offset", offset),
+            zap.String("row", redact.Value(rowText)),
+            zap.String("message", errMsg))
+
+        // put it into the database.
+        exec := common.SQLWithRetry{
+            DB:           em.db,
+            Logger:       logger,
+            HideQueryLog: redact.NeedRedact(),
+        }
+        if err := exec.Exec(ctx, "insert type error record",
+            common.SprintfWithIdentifiers(insertIntoTypeError, em.schema),
+            em.taskID,
+            tableName,
+            path,
+            offset,
+            errMsg,
+            rowText,
+        ); err != nil {
+            return multierr.Append(encodeErr, err)
+        }
+    }
+    return nil
+}
+
+// DataConflictInfo is the information of a data conflict error.
+type DataConflictInfo struct {
+    RawKey   []byte
+    RawValue []byte
+    KeyData  string
+    Row      string
+}
+
+// RecordDataConflictError records a data conflict error.
+func (em *ErrorManager) RecordDataConflictError(
+    ctx context.Context,
+    logger log.Logger,
+    tableName string,
+    conflictInfos []DataConflictInfo,
+) error {
+    var gerr error
+    if len(conflictInfos) == 0 {
+        return nil
+    }
+
+    if em.conflictErrRemain.Sub(int64(len(conflictInfos))) < 0 {
+        threshold := em.configConflict.Threshold
+        // Still need to record this batch of conflict records, and then return this error at the end.
+        // Otherwise, if conflict.threshold is set to a very small value, none of the conflict errors will be recorded.
+        gerr = errors.Errorf(
+            "The number of conflict errors exceeds the threshold configured by `conflict.threshold`: '%d'",
+            threshold)
+    }
+
+    if em.db == nil {
+        return gerr
+    }
+
+    exec := common.SQLWithRetry{
+        DB:           em.db,
+        Logger:       logger,
+        HideQueryLog: redact.NeedRedact(),
+    }
+    if err := exec.Transact(ctx, "insert data conflict error record", func(c context.Context, txn *sql.Tx) error {
+        sb := &strings.Builder{}
+        _, err := common.FprintfWithIdentifiers(sb, insertIntoConflictErrorData, em.schema)
+        if err != nil {
+            return err
+        }
+        var sqlArgs []any
+        for i, conflictInfo := range conflictInfos {
+            if i > 0 {
+                sb.WriteByte(',')
+            }
+            sb.WriteString(sqlValuesConflictErrorData)
+            sqlArgs = append(sqlArgs,
+                em.taskID,
+                tableName,
+                conflictInfo.KeyData,
+                conflictInfo.Row,
+                conflictInfo.RawKey,
+                conflictInfo.RawValue,
+                tablecodec.IsRecordKey(conflictInfo.RawKey),
+            )
+        }
+        _, err = txn.ExecContext(c, sb.String(), sqlArgs...)
+        return err
+    }); err != nil {
+        gerr = err
+    }
+    return gerr
+}
+
+// RecordIndexConflictError records an index conflict error.
+func (em *ErrorManager) RecordIndexConflictError(
+    ctx context.Context,
+    logger log.Logger,
+    tableName string,
+    indexNames []string,
+    conflictInfos []DataConflictInfo,
+    rawHandles, rawRows [][]byte,
+) error {
+    var gerr error
+    if len(conflictInfos) == 0 {
+        return nil
+    }
+
+    if em.conflictErrRemain.Sub(int64(len(conflictInfos))) < 0 {
+        threshold := em.configConflict.Threshold
+        // Still need to record this batch of conflict records, and then return this error at the end.
+        // Otherwise, if conflict.threshold is set to a very small value, none of the conflict errors will be recorded.
+        gerr = errors.Errorf(
+            "The number of conflict errors exceeds the threshold configured by `conflict.threshold`: '%d'",
+            threshold)
+    }
+
+    if em.db == nil {
+        return gerr
+    }
+
+    exec := common.SQLWithRetry{
+        DB:           em.db,
+        Logger:       logger,
+        HideQueryLog: redact.NeedRedact(),
+    }
+    if err := exec.Transact(ctx, "insert index conflict error record", func(c context.Context, txn *sql.Tx) error {
+        sb := &strings.Builder{}
+        _, err := common.FprintfWithIdentifiers(sb, insertIntoConflictErrorIndex, em.schema)
+        if err != nil {
+            return err
+        }
+        var sqlArgs []any
+        for i, conflictInfo := range conflictInfos {
+            if i > 0 {
+                sb.WriteByte(',')
+            }
+            sb.WriteString(sqlValuesConflictErrorIndex)
+            sqlArgs = append(sqlArgs,
+                em.taskID,
+                tableName,
+                indexNames[i],
+                conflictInfo.KeyData,
+                conflictInfo.Row,
+                conflictInfo.RawKey,
+                conflictInfo.RawValue,
+                rawHandles[i],
+                rawRows[i],
+                tablecodec.IsRecordKey(conflictInfo.RawKey),
+            )
+        }
+        _, err = txn.ExecContext(c, sb.String(), sqlArgs...)
+        return err
+    }); err != nil {
+        gerr = err
+    }
+    return gerr
+}
+
+// ReplaceConflictKeys queries all conflicting rows (handles and their values)
+// from the current error report and resolves them by replacing the necessary
+// rows and preserving the others.
+func (em *ErrorManager) ReplaceConflictKeys(
+    ctx context.Context,
+    tbl tidbtbl.Table,
+    tableName string,
+    pool *util.WorkerPool,
+    fnGetLatest func(ctx context.Context, key []byte) ([]byte, error),
+    fnDeleteKeys func(ctx context.Context, key [][]byte) error,
+) error {
+    if em.db == nil {
+        return nil
+    }
+
+    exec := common.SQLWithRetry{
+        DB:           em.db,
+        Logger:       em.logger,
+        HideQueryLog: redact.NeedRedact(),
+    }
+
+    const rowLimit = 1000
+    indexTaskCh := make(chan [2]int64)
+    indexTaskWg := &sync.WaitGroup{}
+    indexG, indexGCtx := errgroup.WithContext(ctx)
+
+    go func() {
+        //nolint:staticcheck
+        //lint:ignore SA2000
+        indexTaskWg.Add(1)
+        indexTaskCh <- [2]int64{0, math.MaxInt64}
+        indexTaskWg.Wait()
+        close(indexTaskCh)
+    }()
+
+    // TODO: provide a detailed document to explain the algorithm and link it here
+    // demo for "replace" algorithm: https://github.com/lyzx2001/tidb-conflict-replace
+    // check index KV
+    for t := range indexTaskCh {
+        start, end := t[0], t[1]
+        pool.ApplyOnErrorGroup(indexG, func() error {
+            defer indexTaskWg.Done()
+
+            sessionOpts := encode.SessionOptions{
+                // TODO: need to find the correct value for SQLMode
+                SQLMode: mysql.ModeStrictAllTables,
+            }
+            encoder, err := kv.NewBaseKVEncoder(&encode.EncodingConfig{
+                Table:          tbl,
+                SessionOptions: sessionOpts,
+                Logger:         em.logger,
+            })
+            if err != nil {
+                return errors.Trace(err)
+            }
+
+            var handleKeys [][]byte
+            var insertRows [][2][]byte
+            for start < end {
+                indexKvRows, err := em.db.QueryContext(
+                    indexGCtx, common.SprintfWithIdentifiers(selectIndexConflictKeysReplace, em.schema),
+                    tableName, start, end, rowLimit)
+                if err != nil {
+                    return errors.Trace(err)
+                }
+
+                var lastRowID int64
+                for indexKvRows.Next() {
+                    var rawKey, rawValue, rawHandle []byte
+                    var indexName string
+                    if err := indexKvRows.Scan(&lastRowID, &rawKey, &indexName, &rawValue, &rawHandle); err != nil {
+                        return errors.Trace(err)
+                    }
+                    em.logger.Debug("got raw_key, index_name, raw_value, raw_handle from table",
+                        zap.Binary("raw_key", rawKey),
+                        zap.String("index_name", indexName),
+                        zap.Binary("raw_value", rawValue),
+                        zap.Binary("raw_handle", rawHandle))
+
+                    // get the latest value of rawKey from downstream TiDB
+                    latestValue, err := fnGetLatest(indexGCtx, rawKey)
+                    if tikverr.IsErrNotFound(err) {
+                        continue
+                    }
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+
+                    // if the latest value of rawKey equals rawValue, this index KV is maintained in downstream TiDB;
+                    // if not, this index KV has been overwritten, and its corresponding data KV needs to be deleted
+                    if bytes.Equal(rawValue, latestValue) {
+                        continue
+                    }
+
+                    // rawHandle is the row key of the data KV that needs to be deleted
+                    // get the latest value of the row key of the data KV that needs to be deleted
+                    overwritten, err := fnGetLatest(indexGCtx, rawHandle)
+                    // if the latest value cannot be found, that means the data KV has been deleted
+                    if tikverr.IsErrNotFound(err) {
+                        continue
+                    }
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+
+                    overwrittenHandle, err := tablecodec.DecodeRowKey(rawHandle)
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+                    decodedData, _, err := tables.DecodeRawRowData(encoder.SessionCtx.GetExprCtx(),
+                        tbl.Meta(), overwrittenHandle, tbl.Cols(), overwritten)
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+                    if !tbl.Meta().HasClusteredIndex() {
+                        // for nonclustered PK, need to append handle to decodedData for AddRecord
+                        decodedData = append(decodedData, types.NewIntDatum(overwrittenHandle.IntValue()))
+                    }
+                    _, err = encoder.AddRecord(decodedData)
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+
+                    // find out all the KV pairs that are contained in the data KV
+                    kvPairs := encoder.SessionCtx.TakeKvPairs()
+
+                    for _, kvPair := range kvPairs.Pairs {
+                        em.logger.Debug("got encoded KV",
+                            logutil.Key("key", kvPair.Key),
+                            zap.Binary("value", kvPair.Val),
+                            logutil.Key("rawKey", rawKey),
+                            zap.Binary("rawValue", rawValue))
+
+                        // If rawKey equals the KV pair's key and rawValue equals the KV pair's value,
+                        // this latest data KV of the index KV needs to be deleted;
+                        // if not, this latest data KV of the index KV was inserted by other rows,
+                        // so it is unrelated to the index KV that needs to be deleted and we cannot delete it.
+
+                        // An example is:
+                        // (pk, uk)
+                        // (1, a)
+                        // (1, b)
+                        // (2, a)
+
+                        // (1, a) is overwritten by (2, a). We found a->1 is an overwritten index KV,
+                        // and we are considering if its data KV with key "1" can be deleted.
+                        // We got the latest value of key "1" which is (1, b),
+                        // and encode it to get all KV pairs, which is [1->b, b->1].
+                        // Only if there is a->1 do we dare to delete the data KV with key "1".
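+                        // In this example the encoded pairs [1->b, b->1] do not
+                        // contain a->1, so the data KV with key "1" is kept: it
+                        // now belongs to row (1, b), not the overwritten (1, a).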
+
+                        if bytes.Equal(kvPair.Key, rawKey) && bytes.Equal(kvPair.Val, rawValue) {
+                            handleKeys = append(handleKeys, rawHandle)
+                            var insertRow [2][]byte
+                            insertRow[0] = rawHandle
+                            insertRow[1] = overwritten
+                            insertRows = append(insertRows, insertRow)
+                            break
+                        }
+                    }
+                }
+                if err := indexKvRows.Err(); err != nil {
+                    _ = indexKvRows.Close()
+                    return errors.Trace(err)
+                }
+                if err := indexKvRows.Close(); err != nil {
+                    return errors.Trace(err)
+                }
+                if len(handleKeys) == 0 {
+                    break
+                }
+                if err := fnDeleteKeys(indexGCtx, handleKeys); err != nil {
+                    return errors.Trace(err)
+                }
+                if err := exec.Transact(ctx, "insert data conflict record for conflict detection 'replace' mode",
+                    func(c context.Context, txn *sql.Tx) error {
+                        sb := &strings.Builder{}
+                        _, err2 := common.FprintfWithIdentifiers(sb, insertIntoConflictErrorData, em.schema)
+                        if err2 != nil {
+                            return errors.Trace(err2)
+                        }
+                        var sqlArgs []any
+                        for i, insertRow := range insertRows {
+                            if i > 0 {
+                                sb.WriteByte(',')
+                            }
+                            sb.WriteString(sqlValuesConflictErrorData)
+                            sqlArgs = append(sqlArgs,
+                                em.taskID,
+                                tableName,
+                                nil,
+                                nil,
+                                insertRow[0],
+                                insertRow[1],
+                                2,
+                            )
+                        }
+                        _, err := txn.ExecContext(c, sb.String(), sqlArgs...)
+                        return errors.Trace(err)
+                    }); err != nil {
+                    return errors.Trace(err)
+                }
+                start = lastRowID + 1
+                // If the remaining tasks cannot be processed at once, split the task
+                // into two subtasks and send one of them to the other idle worker if possible.
+                if end-start > rowLimit {
+                    mid := start + (end-start)/2
+                    indexTaskWg.Add(1)
+                    select {
+                    case indexTaskCh <- [2]int64{mid, end}:
+                        end = mid
+                    default:
+                        indexTaskWg.Done()
+                    }
+                }
+                handleKeys = handleKeys[:0]
+            }
+            return nil
+        })
+    }
+    if err := indexG.Wait(); err != nil {
+        return errors.Trace(err)
+    }
+
+    dataTaskCh := make(chan [2]int64)
+    dataTaskWg := &sync.WaitGroup{}
+    dataG, dataGCtx := errgroup.WithContext(ctx)
+
+    go func() {
+        //nolint:staticcheck
+        //lint:ignore SA2000
+        dataTaskWg.Add(1)
+        dataTaskCh <- [2]int64{0, math.MaxInt64}
+        dataTaskWg.Wait()
+        close(dataTaskCh)
+    }()
+
+    // check data KV
+    for t := range dataTaskCh {
+        start, end := t[0], t[1]
+        pool.ApplyOnErrorGroup(dataG, func() error {
+            defer dataTaskWg.Done()
+
+            sessionOpts := encode.SessionOptions{
+                // TODO: need to find the correct value for SQLMode
+                SQLMode: mysql.ModeStrictAllTables,
+            }
+            encoder, err := kv.NewBaseKVEncoder(&encode.EncodingConfig{
+                Table:          tbl,
+                SessionOptions: sessionOpts,
+                Logger:         em.logger,
+            })
+            if err != nil {
+                return errors.Trace(err)
+            }
+
+            var handleKeys [][]byte
+            for start < end {
+                dataKvRows, err := em.db.QueryContext(
+                    dataGCtx, common.SprintfWithIdentifiers(selectDataConflictKeysReplace, em.schema),
+                    tableName, start, end, rowLimit)
+                if err != nil {
+                    return errors.Trace(err)
+                }
+
+                var lastRowID int64
+                var previousRawKey, latestValue []byte
+                var mustKeepKvPairs *kv.Pairs
+
+                for dataKvRows.Next() {
+                    var rawKey, rawValue []byte
+                    if err := dataKvRows.Scan(&lastRowID, &rawKey, &rawValue); err != nil {
+                        return errors.Trace(err)
+                    }
+                    em.logger.Debug("got group raw_key, raw_value from table",
+                        logutil.Key("raw_key", rawKey),
+                        zap.Binary("raw_value", rawValue))
+
+                    if !bytes.Equal(rawKey, previousRawKey) {
+                        previousRawKey = rawKey
+                        // get the latest value of rawKey from downstream TiDB
+                        latestValue, err = fnGetLatest(dataGCtx, rawKey)
+                        if err != nil && !tikverr.IsErrNotFound(err) {
+                            return errors.Trace(err)
+                        }
+                        if latestValue != nil {
+                            handle, err := tablecodec.DecodeRowKey(rawKey)
+                            if err != nil {
+                                return errors.Trace(err)
+                            }
+                            decodedData, _, err := tables.DecodeRawRowData(encoder.SessionCtx.GetExprCtx(),
+                                tbl.Meta(), handle, tbl.Cols(), latestValue)
+                            if err != nil {
+                                return errors.Trace(err)
+                            }
+                            if !tbl.Meta().HasClusteredIndex() {
+                                // for nonclustered PK, need to append handle to decodedData for AddRecord
+                                decodedData = append(decodedData, types.NewIntDatum(handle.IntValue()))
+                            }
+                            _, err = encoder.AddRecord(decodedData)
+                            if err != nil {
+                                return errors.Trace(err)
+                            }
+                            // calculate the new mustKeepKvPairs corresponding to the new rawKey
+                            // find out all the KV pairs that are contained in the data KV
+                            mustKeepKvPairs = encoder.SessionCtx.TakeKvPairs()
+                        }
+                    }
+
+                    // if the latest value of rawKey equals rawValue, this data KV is maintained in downstream TiDB;
+                    // if not, this data KV has been deleted due to an overwritten index KV
+                    if bytes.Equal(rawValue, latestValue) {
+                        continue
+                    }
+
+                    handle, err := tablecodec.DecodeRowKey(rawKey)
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+                    decodedData, _, err := tables.DecodeRawRowData(encoder.SessionCtx.GetExprCtx(),
+                        tbl.Meta(), handle, tbl.Cols(), rawValue)
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+                    if !tbl.Meta().HasClusteredIndex() {
+                        // for nonclustered PK, need to append handle to decodedData for AddRecord
+                        decodedData = append(decodedData, types.NewIntDatum(handle.IntValue()))
+                    }
+                    _, err = encoder.AddRecord(decodedData)
+                    if err != nil {
+                        return errors.Trace(err)
+                    }
+
+                    // find out all the KV pairs that are contained in the data KV
+                    kvPairs := encoder.SessionCtx.TakeKvPairs()
+                    for _, kvPair := range kvPairs.Pairs {
+                        em.logger.Debug("got encoded KV",
+                            logutil.Key("key", kvPair.Key),
+                            zap.Binary("value", kvPair.Val))
+                        kvLatestValue, err := fnGetLatest(dataGCtx, kvPair.Key)
+                        if tikverr.IsErrNotFound(err) {
+                            continue
+                        }
+                        if err != nil {
+                            return errors.Trace(err)
+                        }
+
+                        // if the value of the KV pair is not equal to the latest value of the key of the KV pair,
+                        // the value of the KV pair has been overwritten, so it needs no extra operation
+                        if !bytes.Equal(kvLatestValue, kvPair.Val) {
+                            continue
+                        }
+
+                        // if the KV pair is contained in mustKeepKvPairs, we cannot delete it;
+                        // if not, delete the KV pair
+                        if mustKeepKvPairs != nil {
+                            isContained := slices.ContainsFunc(mustKeepKvPairs.Pairs, func(mustKeepKvPair common.KvPair) bool {
+                                return bytes.Equal(mustKeepKvPair.Key, kvPair.Key) && bytes.Equal(mustKeepKvPair.Val, kvPair.Val)
+                            })
+                            if isContained {
+                                continue
+                            }
+                        }
+
+                        handleKeys = append(handleKeys, kvPair.Key)
+                    }
+                }
+                if err := dataKvRows.Err(); err != nil {
+                    _ = dataKvRows.Close()
+                    return errors.Trace(err)
+                }
+                if err := dataKvRows.Close(); err != nil {
+                    return errors.Trace(err)
+                }
+                if len(handleKeys) == 0 {
+                    break
+                }
+                if err := fnDeleteKeys(dataGCtx, handleKeys); err != nil {
+                    return errors.Trace(err)
+                }
+                start = lastRowID + 1
+                // If the remaining tasks cannot be processed at once, split the task
+                // into two subtasks and send one of them to the other idle worker if possible.
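+                // For example, the initial task [0, MaxInt64) shrinks to
+                // [lastRowID+1, mid) here while [mid, MaxInt64) is offered to the
+                // channel; if no worker is idle, this worker keeps the whole range.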
+                if end-start > rowLimit {
+                    mid := start + (end-start)/2
+                    dataTaskWg.Add(1)
+                    select {
+                    case dataTaskCh <- [2]int64{mid, end}:
+                        end = mid
+                    default:
+                        dataTaskWg.Done()
+                    }
+                }
+                handleKeys = handleKeys[:0]
+            }
+            return nil
+        })
+    }
+    if err := dataG.Wait(); err != nil {
+        return errors.Trace(err)
+    }
+
+    hasRow := true
+    for {
+        // delete the additionally inserted rows for nonclustered PK
+        if err := exec.Transact(ctx, "delete additionally inserted rows for conflict detection 'replace' mode",
+            func(c context.Context, txn *sql.Tx) error {
+                sb := &strings.Builder{}
+                _, err2 := common.FprintfWithIdentifiers(sb, deleteNullDataRow, em.schema)
+                if err2 != nil {
+                    return errors.Trace(err2)
+                }
+                result, err := txn.ExecContext(c, sb.String(), rowLimit)
+                if err != nil {
+                    return errors.Trace(err)
+                }
+                affected, err := result.RowsAffected()
+                if err != nil {
+                    return errors.Trace(err)
+                }
+                if affected == 0 {
+                    hasRow = false
+                }
+                return nil
+            }); err != nil {
+            return errors.Trace(err)
+        }
+        if !hasRow {
+            break
+        }
+    }
+
+    return nil
+}
+
+// RecordDuplicateCount reduces the counter of "duplicate entry" errors.
+// Currently, the count will not be shared across multiple lightning instances.
+func (em *ErrorManager) RecordDuplicateCount(cnt int64) error {
+    if em.conflictErrRemain.Sub(cnt) < 0 {
+        threshold := em.configConflict.Threshold
+        return errors.Errorf(
+            "The number of conflict errors exceeds the threshold configured by `conflict.threshold`: '%d'",
+            threshold)
+    }
+    return nil
+}
+
+// RecordDuplicate records a "duplicate entry" error so the user can query it later.
+// Currently, the error will not be shared across multiple lightning instances.
+func (em *ErrorManager) RecordDuplicate(
+    ctx context.Context,
+    logger log.Logger,
+    tableName string,
+    path string,
+    offset int64,
+    errMsg string,
+    rowID int64,
+    rowData string,
+) error {
+    if em.conflictErrRemain.Dec() < 0 {
+        threshold := em.configConflict.Threshold
+        return errors.Errorf(
+            "The number of conflict errors exceeds the threshold configured by `conflict.threshold`: '%d'",
+            threshold)
+    }
+    if em.db == nil {
+        return nil
+    }
+    if em.conflictRecordsRemain.Add(-1) < 0 {
+        return nil
+    }
+
+    return em.recordDuplicate(ctx, logger, tableName, path, offset, errMsg, rowID, rowData)
+}
+
+func (em *ErrorManager) recordDuplicate(
+    ctx context.Context,
+    logger log.Logger,
+    tableName string,
+    path string,
+    offset int64,
+    errMsg string,
+    rowID int64,
+    rowData string,
+) error {
+    exec := common.SQLWithRetry{
+        DB:           em.db,
+        Logger:       logger,
+        HideQueryLog: redact.NeedRedact(),
+    }
+    return exec.Exec(ctx, "insert duplicate record",
+        common.SprintfWithIdentifiers(insertIntoDupRecord, em.schema),
+        em.taskID,
+        tableName,
+        path,
+        offset,
+        errMsg,
+        rowID,
+        rowData,
+    )
+}
+
+// RecordDuplicateOnce records a "duplicate entry" error so the user can query it later.
+// Currently, the error will not be shared across multiple lightning instances.
+// Different from RecordDuplicate, this function is used when conflict.strategy
+// is "error" and will only write the first conflict error to the table.
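+// The CompareAndSwap on recordErrorOnce below guarantees that only the first
+// caller writes a record; concurrent or later callers return immediately.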
+func (em *ErrorManager) RecordDuplicateOnce(
+    ctx context.Context,
+    logger log.Logger,
+    tableName string,
+    path string,
+    offset int64,
+    errMsg string,
+    rowID int64,
+    rowData string,
+) {
+    ok := em.recordErrorOnce.CompareAndSwap(false, true)
+    if !ok {
+        return
+    }
+    err := em.recordDuplicate(ctx, logger, tableName, path, offset, errMsg, rowID, rowData)
+    if err != nil {
+        logger.Warn("meet error when recording duplicate entry error", zap.Error(err))
+    }
+}
+
+func (em *ErrorManager) errorCount(typeVal func(*config.MaxError) int64) int64 {
+    cfgVal := typeVal(em.configError)
+    val := typeVal(&em.remainingError)
+    if val < 0 {
+        val = 0
+    }
+    return cfgVal - val
+}
+
+func (em *ErrorManager) typeErrors() int64 {
+    return em.errorCount(func(maxError *config.MaxError) int64 {
+        return maxError.Type.Load()
+    })
+}
+
+func (em *ErrorManager) syntaxError() int64 {
+    return em.errorCount(func(maxError *config.MaxError) int64 {
+        return maxError.Syntax.Load()
+    })
+}
+
+func (em *ErrorManager) conflictError() int64 {
+    val := em.conflictErrRemain.Load()
+    if val < 0 {
+        val = 0
+    }
+    return em.configConflict.Threshold - val
+}
+
+func (em *ErrorManager) charsetError() int64 {
+    return em.errorCount(func(maxError *config.MaxError) int64 {
+        return maxError.Charset.Load()
+    })
+}
+
+// HasError returns true if any error has been recorded.
+func (em *ErrorManager) HasError() bool {
+    return em.typeErrors() > 0 || em.syntaxError() > 0 ||
+        em.charsetError() > 0 || em.conflictError() > 0
+}
+
+// LogErrorDetails logs a warning for each error type that has been recorded.
+func (em *ErrorManager) LogErrorDetails() {
+    fmtErrMsg := func(cnt int64, errType, tblName string) string {
+        return fmt.Sprintf("Detect %d %s errors in total, please refer to table %s for more details",
+            cnt, errType, em.fmtTableName(tblName))
+    }
+    if errCnt := em.typeErrors(); errCnt > 0 {
+        em.logger.Warn(fmtErrMsg(errCnt, "data type", typeErrorTableName))
+    }
+    if errCnt := em.syntaxError(); errCnt > 0 {
+        em.logger.Warn(fmtErrMsg(errCnt, "data syntax", syntaxErrorTableName))
+    }
+    if errCnt := em.charsetError(); errCnt > 0 {
+        // TODO: add charset table name
+        em.logger.Warn(fmtErrMsg(errCnt, "data charset", ""))
+    }
+    errCnt := em.conflictError()
+    if errCnt > 0 && (em.conflictV1Enabled || em.conflictV2Enabled) {
+        em.logger.Warn(fmtErrMsg(errCnt, "conflict", ConflictViewName))
+    }
+}
+
+func (em *ErrorManager) fmtTableName(t string) string {
+    return common.UniqueTable(em.schema, t)
+}
+
+// Output renders a table that contains an error summary for each error type.
+func (em *ErrorManager) Output() string {
+    if !em.HasError() {
+        return ""
+    }
+
+    t := table.NewWriter()
+    t.AppendHeader(table.Row{"#", "Error Type", "Error Count", "Error Data Table"})
+    t.SetColumnConfigs([]table.ColumnConfig{
+        {Name: "#"},
+        {Name: "Error Type"},
+        {Name: "Error Count"},
+        {Name: "Error Data Table"},
+    })
+    t.SetRowPainter(func(table.Row) text.Colors {
+        return text.Colors{text.FgRed}
+    })
+
+    count := 0
+    if errCnt := em.typeErrors(); errCnt > 0 {
+        count++
+        t.AppendRow(table.Row{count, "Data Type", errCnt, em.fmtTableName(typeErrorTableName)})
+    }
+    if errCnt := em.syntaxError(); errCnt > 0 {
+        count++
+        t.AppendRow(table.Row{count, "Data Syntax", errCnt, em.fmtTableName(syntaxErrorTableName)})
+    }
+    if errCnt := em.charsetError(); errCnt > 0 {
+        count++
+        // do not support recording charset errors now.
+        t.AppendRow(table.Row{count, "Charset Error", errCnt, ""})
+    }
+    if errCnt := em.conflictError(); errCnt > 0 {
+        count++
+        if em.conflictV1Enabled || em.conflictV2Enabled {
+            t.AppendRow(table.Row{count, "Unique Key Conflict", errCnt, em.fmtTableName(ConflictViewName)})
+        }
+    }
+
+    res := "\nImport Data Error Summary: \n"
+    res += t.Render()
+    res += "\n"
+
+    return res
+}
diff --git a/pkg/lightning/errormanager/errormanager_test.go b/pkg/lightning/errormanager/errormanager_test.go
new file mode 100644
index 0000000000000..7b02b2772a77e
--- /dev/null
+++ b/pkg/lightning/errormanager/errormanager_test.go
@@ -0,0 +1,724 @@
+// Copyright 2021 PingCAP, Inc.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package errormanager
+
+import (
+    "bytes"
+    "context"
+    "database/sql/driver"
+    "fmt"
+    "io"
+    "testing"
+
+    "github.com/DATA-DOG/go-sqlmock"
+    "github.com/pingcap/tidb/pkg/lightning/backend/encode"
+    tidbkv "github.com/pingcap/tidb/pkg/lightning/backend/kv"
+    "github.com/pingcap/tidb/pkg/lightning/config"
+    "github.com/pingcap/tidb/pkg/lightning/log"
+    "github.com/pingcap/tidb/pkg/meta/model"
+    pmodel "github.com/pingcap/tidb/pkg/parser/model"
+    "github.com/pingcap/tidb/pkg/parser/mysql"
+    "github.com/pingcap/tidb/pkg/table/tables"
+    "github.com/pingcap/tidb/pkg/types"
+    "github.com/pingcap/tidb/pkg/util"
+    "github.com/stretchr/testify/require"
+    "go.uber.org/atomic"
+)
+
+func TestInit(t *testing.T) {
+    db, mock, err := sqlmock.New()
+    require.NoError(t, err)
+
+    cfg := config.NewConfig()
+    cfg.TikvImporter.Backend = config.BackendLocal
+    cfg.TikvImporter.DuplicateResolution = config.NoneOnDup
+    cfg.Conflict.Strategy = config.ReplaceOnDup
+    cfg.Conflict.PrecheckConflictBeforeImport = true
+    cfg.App.MaxError.Type.Store(10)
+    cfg.Conflict.Threshold = 20
+    cfg.App.TaskInfoSchemaName = "lightning_errors"
+
+    em := New(db, cfg, log.L())
+    require.True(t, em.conflictV1Enabled)
+    require.True(t, em.conflictV2Enabled)
+    require.Equal(t, cfg.App.MaxError.Type.Load(), em.remainingError.Type.Load())
+    require.Equal(t, cfg.Conflict.Threshold, em.conflictErrRemain.Load())
+
+    em.remainingError.Type.Store(0)
+    em.conflictV1Enabled = false
+    em.conflictV2Enabled = false
+    ctx := context.Background()
+    err = em.Init(ctx)
+    require.NoError(t, err)
+
+    em.conflictV1Enabled = true
+    mock.ExpectExec("CREATE SCHEMA IF NOT EXISTS `lightning_errors`;").
+        WillReturnResult(sqlmock.NewResult(1, 1))
+    mock.ExpectExec("CREATE TABLE IF NOT EXISTS `lightning_errors`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(2, 1))
+    mock.ExpectExec("CREATE OR REPLACE VIEW `lightning_errors`\\.conflict_view.*").
+        WillReturnResult(sqlmock.NewResult(3, 1))
+    err = em.Init(ctx)
+    require.NoError(t, err)
+    require.NoError(t, mock.ExpectationsWereMet())
+
+    em.conflictV2Enabled = true
+    em.remainingError.Type.Store(1)
+    mock.ExpectExec("CREATE SCHEMA IF NOT EXISTS `lightning_errors`.*").
+        WillReturnResult(sqlmock.NewResult(5, 1))
+    mock.ExpectExec("CREATE TABLE IF NOT EXISTS `lightning_errors`\\.type_error_v2.*").
+        WillReturnResult(sqlmock.NewResult(6, 1))
+    mock.ExpectExec("CREATE TABLE IF NOT EXISTS `lightning_errors`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(7, 1))
+    mock.ExpectExec("CREATE TABLE IF NOT EXISTS `lightning_errors`\\.conflict_records_v2.*").
+        WillReturnResult(sqlmock.NewResult(7, 1))
+    mock.ExpectExec("CREATE OR REPLACE VIEW `lightning_errors`\\.conflict_view.*").
+        WillReturnResult(sqlmock.NewResult(7, 1))
+    err = em.Init(ctx)
+    require.NoError(t, err)
+    require.NoError(t, mock.ExpectationsWereMet())
+}
+
+type mockDriver struct {
+    driver.Driver
+    totalRows int64
+}
+
+func (m mockDriver) Open(_ string) (driver.Conn, error) {
+    return mockConn{totalRows: m.totalRows}, nil
+}
+
+type mockConn struct {
+    driver.Conn
+    driver.ExecerContext
+    driver.QueryerContext
+    totalRows int64
+}
+
+func (c mockConn) ExecContext(_ context.Context, _ string, _ []driver.NamedValue) (driver.Result, error) {
+    return sqlmock.NewResult(1, 1), nil
+}
+
+func (mockConn) Close() error { return nil }
+
+type mockRows struct {
+    driver.Rows
+    start int64
+    end   int64
+}
+
+func (r *mockRows) Columns() []string {
+    return []string{"id", "raw_handle", "raw_row"}
+}
+
+func (r *mockRows) Close() error { return nil }
+
+func (r *mockRows) Next(dest []driver.Value) error {
+    if r.start >= r.end {
+        return io.EOF
+    }
+    dest[0] = r.start  // id
+    dest[1] = []byte{} // raw_handle
+    dest[2] = []byte{} // raw_row
+    r.start++
+    return nil
+}
+
+func (c mockConn) QueryContext(_ context.Context, query string, args []driver.NamedValue) (driver.Rows, error) {
+    expectedQuery := "SELECT id, raw_handle, raw_row.*"
+    if err := sqlmock.QueryMatcherRegexp.Match(expectedQuery, query); err != nil {
+        return &mockRows{}, nil
+    }
+    if len(args) != 4 {
+        return &mockRows{}, nil
+    }
+    // args are tableName, start, end, and limit.
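+    // A sketch of the clamping below: mocked row ids start at 1 and stop at
+    // totalRows, and at most `limit` rows are returned, mimicking how the real
+    // conflict queries page through an id range.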
+    start := args[1].Value.(int64)
+    if start < 1 {
+        start = 1
+    }
+    end := args[2].Value.(int64)
+    if end > c.totalRows+1 {
+        end = c.totalRows + 1
+    }
+    limit := args[3].Value.(int64)
+    if start+limit < end {
+        end = start + limit
+    }
+    return &mockRows{start: start, end: end}, nil
+}
+
+func TestReplaceConflictOneKey(t *testing.T) {
+    column1 := &model.ColumnInfo{
+        ID:           1,
+        Name:         pmodel.NewCIStr("a"),
+        Offset:       0,
+        DefaultValue: 0,
+        FieldType:    *types.NewFieldType(mysql.TypeLong),
+        Hidden:       true,
+        State:        model.StatePublic,
+    }
+    column1.AddFlag(mysql.PriKeyFlag)
+
+    column2 := &model.ColumnInfo{
+        ID:           2,
+        Name:         pmodel.NewCIStr("b"),
+        Offset:       1,
+        DefaultValue: 0,
+        FieldType:    *types.NewFieldType(mysql.TypeLong),
+        Hidden:       true,
+        State:        model.StatePublic,
+    }
+
+    column3 := &model.ColumnInfo{
+        ID:           3,
+        Name:         pmodel.NewCIStr("c"),
+        Offset:       2,
+        DefaultValue: 0,
+        FieldType:    *types.NewFieldType(mysql.TypeBlob),
+        Hidden:       true,
+        State:        model.StatePublic,
+    }
+
+    index := &model.IndexInfo{
+        ID:    1,
+        Name:  pmodel.NewCIStr("key_b"),
+        Table: pmodel.NewCIStr(""),
+        Columns: []*model.IndexColumn{
+            {
+                Name:   pmodel.NewCIStr("b"),
+                Offset: 1,
+                Length: -1,
+            }},
+        Unique:  false,
+        Primary: false,
+        State:   model.StatePublic,
+    }
+
+    table := &model.TableInfo{
+        ID:         104,
+        Name:       pmodel.NewCIStr("a"),
+        Charset:    "utf8mb4",
+        Collate:    "utf8mb4_bin",
+        Columns:    []*model.ColumnInfo{column1, column2, column3},
+        Indices:    []*model.IndexInfo{index},
+        PKIsHandle: true,
+        State:      model.StatePublic,
+    }
+
+    tbl, err := tables.TableFromMeta(tidbkv.NewPanickingAllocators(table.SepAutoInc()), table)
+    require.NoError(t, err)
+
+    sessionOpts := encode.SessionOptions{
+        SQLMode:   mysql.ModeStrictAllTables,
+        Timestamp: 1234567890,
+    }
+
+    encoder, err := tidbkv.NewBaseKVEncoder(&encode.EncodingConfig{
+        Table:          tbl,
+        SessionOptions: sessionOpts,
+        Logger:         log.L(),
+    })
+    require.NoError(t, err)
+    encoder.SessionCtx.GetTableCtx().GetRowEncodingConfig().RowEncoder.Enable = true
+
+    data1 := []types.Datum{
+        types.NewIntDatum(1),
+        types.NewIntDatum(6),
+        types.NewStringDatum("1.csv"),
+    }
+    data2 := []types.Datum{
+        types.NewIntDatum(2),
+        types.NewIntDatum(6),
+        types.NewStringDatum("2.csv"),
+    }
+    data3 := []types.Datum{
+        types.NewIntDatum(3),
+        types.NewIntDatum(3),
+        types.NewStringDatum("3.csv"),
+    }
+    data4 := []types.Datum{
+        types.NewIntDatum(3),
+        types.NewIntDatum(4),
+        types.NewStringDatum("4.csv"),
+    }
+    data5 := []types.Datum{
+        types.NewIntDatum(5),
+        types.NewIntDatum(4),
+        types.NewStringDatum("5.csv"),
+    }
+    _, err = encoder.AddRecord(data1)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data2)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data3)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data4)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data5)
+    require.NoError(t, err)
+    kvPairs := encoder.SessionCtx.TakeKvPairs()
+
+    data1IndexKey := kvPairs.Pairs[7].Key
+    data1IndexValue := kvPairs.Pairs[7].Val
+    data1RowKey := kvPairs.Pairs[4].Key
+    data1RowValue := kvPairs.Pairs[4].Val
+    data2RowValue := kvPairs.Pairs[6].Val
+
+    db, mockDB, err := sqlmock.New()
+    require.NoError(t, err)
+    defer func() {
+        _ = db.Close()
+    }()
+
+    ctx, cancel := context.WithCancel(context.Background())
+    defer cancel()
+
+    mockDB.ExpectExec("CREATE SCHEMA IF NOT EXISTS `lightning_task_info`").
+        WillReturnResult(sqlmock.NewResult(1, 1))
+    mockDB.ExpectExec("CREATE TABLE IF NOT EXISTS `lightning_task_info`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(2, 1))
+    mockDB.ExpectExec("CREATE OR REPLACE VIEW `lightning_task_info`\\.conflict_view.*").
+        WillReturnResult(sqlmock.NewResult(3, 1))
+    mockDB.ExpectQuery("\\QSELECT id, raw_key, index_name, raw_value, raw_handle FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type = 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+        WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "index_name", "raw_value", "raw_handle"}))
+    mockDB.ExpectQuery("\\QSELECT id, raw_key, raw_value FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type <> 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+        WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "raw_value"}).
+            AddRow(1, data1RowKey, data1RowValue).
+            AddRow(2, data1RowKey, data2RowValue))
+    for i := 0; i < 2; i++ {
+        mockDB.ExpectQuery("\\QSELECT id, raw_key, raw_value FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type <> 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+            WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "raw_value"}))
+    }
+    mockDB.ExpectBegin()
+    mockDB.ExpectExec("DELETE FROM `lightning_task_info`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(0, 0))
+    mockDB.ExpectCommit()
+
+    cfg := config.NewConfig()
+    cfg.Conflict.Strategy = config.ReplaceOnDup
+    cfg.TikvImporter.Backend = config.BackendLocal
+    cfg.App.TaskInfoSchemaName = "lightning_task_info"
+    em := New(db, cfg, log.L())
+    err = em.Init(ctx)
+    require.NoError(t, err)
+
+    fnGetLatestCount := atomic.NewInt32(0)
+    fnDeleteKeyCount := atomic.NewInt32(0)
+    pool := util.NewWorkerPool(16, "resolve duplicate rows by replace")
+    err = em.ReplaceConflictKeys(
+        ctx, tbl, "test", pool,
+        func(ctx context.Context, key []byte) ([]byte, error) {
+            fnGetLatestCount.Add(1)
+            switch {
+            case bytes.Equal(key, data1IndexKey):
+                return data1IndexValue, nil
+            case bytes.Equal(key, data1RowKey):
+                return data1RowValue, nil
+            default:
+                return nil, fmt.Errorf("key %v is not expected", key)
+            }
+        },
+        func(ctx context.Context, keys [][]byte) error {
+            fnDeleteKeyCount.Add(int32(len(keys)))
+            for _, key := range keys {
+                if !bytes.Equal(key, data1IndexKey) {
+                    return fmt.Errorf("key %v is not expected", key)
+                }
+            }
+            return nil
+        },
+    )
+    require.NoError(t, err)
+    require.Equal(t, int32(3), fnGetLatestCount.Load())
+    require.Equal(t, int32(1), fnDeleteKeyCount.Load())
+    err = mockDB.ExpectationsWereMet()
+    require.NoError(t, err)
+}
+
+func TestReplaceConflictOneUniqueKey(t *testing.T) {
+    column1 := &model.ColumnInfo{
+        ID:           1,
+        Name:         pmodel.NewCIStr("a"),
+        Offset:       0,
+        DefaultValue: 0,
+        FieldType:    *types.NewFieldType(mysql.TypeLong),
+        Hidden:       true,
+        State:        model.StatePublic,
+    }
+    column1.AddFlag(mysql.PriKeyFlag)
+
+    column2 := &model.ColumnInfo{
+        ID:           2,
+        Name:         pmodel.NewCIStr("b"),
+        Offset:       1,
+        DefaultValue: 0,
+        FieldType:    *types.NewFieldType(mysql.TypeLong),
+        Hidden:       true,
+        State:        model.StatePublic,
+    }
+    column2.AddFlag(mysql.UniqueKeyFlag)
+
+    column3 := &model.ColumnInfo{
+        ID:           3,
+        Name:         pmodel.NewCIStr("c"),
+        Offset:       2,
+        DefaultValue: 0,
+        FieldType:    *types.NewFieldType(mysql.TypeBlob),
+        Hidden:       true,
+        State:        model.StatePublic,
+    }
+
+    index := &model.IndexInfo{
+        ID:    1,
+        Name:  pmodel.NewCIStr("uni_b"),
+        Table: pmodel.NewCIStr(""),
+        Columns: []*model.IndexColumn{
+            {
+                Name:   pmodel.NewCIStr("b"),
+                Offset: 1,
+                Length: -1,
+            }},
+        Unique:  true,
+        Primary: false,
+        State:   model.StatePublic,
+    }
+
+    table := &model.TableInfo{
+        ID:         104,
+        Name:       pmodel.NewCIStr("a"),
+        Charset:    "utf8mb4",
+        Collate:    "utf8mb4_bin",
+        Columns:    []*model.ColumnInfo{column1, column2, column3},
+        Indices:    []*model.IndexInfo{index},
+        PKIsHandle: true,
+        State:      model.StatePublic,
+    }
+
+    tbl, err := tables.TableFromMeta(tidbkv.NewPanickingAllocators(table.SepAutoInc()), table)
+    require.NoError(t, err)
+
+    sessionOpts := encode.SessionOptions{
+        SQLMode:   mysql.ModeStrictAllTables,
+        Timestamp: 1234567890,
+    }
+
+    encoder, err := tidbkv.NewBaseKVEncoder(&encode.EncodingConfig{
+        Table:          tbl,
+        SessionOptions: sessionOpts,
+        Logger:         log.L(),
+    })
+    require.NoError(t, err)
+    encoder.SessionCtx.GetTableCtx().GetRowEncodingConfig().RowEncoder.Enable = true
+
+    data1 := []types.Datum{
+        types.NewIntDatum(1),
+        types.NewIntDatum(6),
+        types.NewStringDatum("1.csv"),
+    }
+    data2 := []types.Datum{
+        types.NewIntDatum(2),
+        types.NewIntDatum(6),
+        types.NewStringDatum("2.csv"),
+    }
+    data3 := []types.Datum{
+        types.NewIntDatum(3),
+        types.NewIntDatum(3),
+        types.NewStringDatum("3.csv"),
+    }
+    data4 := []types.Datum{
+        types.NewIntDatum(3),
+        types.NewIntDatum(4),
+        types.NewStringDatum("4.csv"),
+    }
+    data5 := []types.Datum{
+        types.NewIntDatum(5),
+        types.NewIntDatum(4),
+        types.NewStringDatum("5.csv"),
+    }
+    _, err = encoder.AddRecord(data1)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data2)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data3)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data4)
+    require.NoError(t, err)
+    _, err = encoder.AddRecord(data5)
+    require.NoError(t, err)
+    kvPairs := encoder.SessionCtx.TakeKvPairs()
+
+    data1IndexKey := kvPairs.Pairs[7].Key
+    data3IndexKey := kvPairs.Pairs[1].Key
+    data1IndexValue := kvPairs.Pairs[7].Val
+    data2IndexValue := kvPairs.Pairs[9].Val
+    data3IndexValue := kvPairs.Pairs[1].Val
+    data4IndexValue := kvPairs.Pairs[3].Val
+    data1RowKey := kvPairs.Pairs[4].Key
+    data2RowKey := kvPairs.Pairs[8].Key
+    data3RowKey := kvPairs.Pairs[0].Key
+    data4RowKey := kvPairs.Pairs[2].Key
+    data1RowValue := kvPairs.Pairs[4].Val
+    data2RowValue := kvPairs.Pairs[8].Val
+    data3RowValue := kvPairs.Pairs[6].Val
+    data4RowValue := kvPairs.Pairs[2].Val
+
+    db, mockDB, err := sqlmock.New()
+    require.NoError(t, err)
+    defer func() {
+        _ = db.Close()
+    }()
+
+    ctx, cancel := context.WithCancel(context.Background())
+    defer cancel()
+
+    mockDB.ExpectExec("CREATE SCHEMA IF NOT EXISTS `lightning_task_info`").
+        WillReturnResult(sqlmock.NewResult(1, 1))
+    mockDB.ExpectExec("CREATE TABLE IF NOT EXISTS `lightning_task_info`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(2, 1))
+    mockDB.ExpectExec("CREATE OR REPLACE VIEW `lightning_task_info`\\.conflict_view.*").
+        WillReturnResult(sqlmock.NewResult(3, 1))
+    mockDB.ExpectQuery("\\QSELECT id, raw_key, index_name, raw_value, raw_handle FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type = 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+        WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "index_name", "raw_value", "raw_handle"}).
+            AddRow(1, data1IndexKey, "uni_b", data1IndexValue, data1RowKey).
+            AddRow(2, data1IndexKey, "uni_b", data2IndexValue, data2RowKey).
+            AddRow(3, data3IndexKey, "uni_b", data3IndexValue, data3RowKey).
+            AddRow(4, data3IndexKey, "uni_b", data4IndexValue, data4RowKey))
+    mockDB.ExpectBegin()
+    mockDB.ExpectExec("INSERT INTO `lightning_task_info`\\.conflict_error_v4.*").
+        WithArgs(0, "test", nil, nil, data2RowKey, data2RowValue, 2,
+            0, "test", nil, nil, data4RowKey, data4RowValue, 2).
+        WillReturnResult(driver.ResultNoRows)
+    mockDB.ExpectCommit()
+    for i := 0; i < 2; i++ {
+        mockDB.ExpectQuery("\\QSELECT id, raw_key, index_name, raw_value, raw_handle FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type = 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+            WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "index_name", "raw_value", "raw_handle"}))
+    }
+    mockDB.ExpectQuery("\\QSELECT id, raw_key, raw_value FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type <> 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+        WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "raw_value"}).
+            AddRow(1, data1RowKey, data1RowValue).
+            AddRow(2, data1RowKey, data3RowValue))
+    for i := 0; i < 2; i++ {
+        mockDB.ExpectQuery("\\QSELECT id, raw_key, raw_value FROM `lightning_task_info`.conflict_error_v4 WHERE table_name = ? AND kv_type <> 0 AND id >= ? and id < ? ORDER BY id LIMIT ?\\E").
+            WillReturnRows(sqlmock.NewRows([]string{"id", "raw_key", "raw_value"}))
+    }
+    mockDB.ExpectBegin()
+    mockDB.ExpectExec("DELETE FROM `lightning_task_info`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(0, 2))
+    mockDB.ExpectCommit()
+    mockDB.ExpectBegin()
+    mockDB.ExpectExec("DELETE FROM `lightning_task_info`\\.conflict_error_v4.*").
+        WillReturnResult(sqlmock.NewResult(0, 0))
+    mockDB.ExpectCommit()
+
+    cfg := config.NewConfig()
+    cfg.Conflict.Strategy = config.ReplaceOnDup
+    cfg.TikvImporter.Backend = config.BackendLocal
+    cfg.App.TaskInfoSchemaName = "lightning_task_info"
+    em := New(db, cfg, log.L())
+    err = em.Init(ctx)
+    require.NoError(t, err)
+
+    fnGetLatestCount := atomic.NewInt32(0)
+    fnDeleteKeyCount := atomic.NewInt32(0)
+    pool := util.NewWorkerPool(16, "resolve duplicate rows by replace")
+    err = em.ReplaceConflictKeys(
+        ctx, tbl, "test", pool,
+        func(ctx context.Context, key []byte) ([]byte, error) {
+            fnGetLatestCount.Add(1)
+            switch {
+            case bytes.Equal(key, data1IndexKey):
+                return data1IndexValue, nil
+            case bytes.Equal(key, data3IndexKey):
+                return data3IndexValue, nil
+            case bytes.Equal(key, data1RowKey):
+                return data1RowValue, nil
+            case bytes.Equal(key, data2RowKey):
+                return data2RowValue, nil
+            case bytes.Equal(key, data4RowKey):
+                return data4RowValue, nil
+            default:
+                return nil, fmt.Errorf("key %v is not expected", key)
+            }
+        },
+        func(ctx context.Context, keys [][]byte) error {
+            fnDeleteKeyCount.Add(int32(len(keys)))
+            for _, key := range keys {
+                if !bytes.Equal(key, data1IndexKey) && !bytes.Equal(key, data2RowKey) && !bytes.Equal(key, data4RowKey) {
+                    return fmt.Errorf("key %v is not expected", key)
+                }
+            }
+            return nil
+        },
+    )
+    require.NoError(t, err)
+    require.Equal(t, int32(9), fnGetLatestCount.Load())
+    require.Equal(t, int32(3), fnDeleteKeyCount.Load())
+    err = mockDB.ExpectationsWereMet()
+    require.NoError(t, err)
+}
+
+func TestErrorMgrHasError(t *testing.T) {
+    cfg := &config.Config{}
+    cfg.App.MaxError = config.MaxError{
+        Syntax:  *atomic.NewInt64(100),
+        Charset: *atomic.NewInt64(100),
+        Type:    *atomic.NewInt64(100),
+    }
+    cfg.Conflict.Threshold = 100
+    em := &ErrorManager{
+        configError:       &cfg.App.MaxError,
+        remainingError:    cfg.App.MaxError,
+        configConflict:    &cfg.Conflict,
+        conflictErrRemain: atomic.NewInt64(100),
+    }
+
+    // no field changes, should return false
+    require.False(t, em.HasError())
+
+    // change single field
+    em.remainingError.Syntax.Sub(1)
+    require.True(t, em.HasError())
+
+    em.remainingError = cfg.App.MaxError
+    em.remainingError.Charset.Sub(1)
+    require.True(t, em.HasError())
+
+    em.remainingError = cfg.App.MaxError
+    em.remainingError.Type.Sub(1)
+    require.True(t, em.HasError())
+
+    em.remainingError = cfg.App.MaxError
+    em.conflictErrRemain.Sub(1)
+    require.True(t, em.HasError())
+
+    // change multiple keys
+    em.remainingError = cfg.App.MaxError
+    em.remainingError.Syntax.Store(0)
+    em.remainingError.Charset.Store(0)
+    em.remainingError.Type.Store(0)
+    em.conflictErrRemain.Store(0)
+    require.True(t, em.HasError())
+}
+
+func TestErrorMgrErrorOutput(t *testing.T) {
+    cfg := &config.Config{}
+    cfg.App.MaxError = config.MaxError{
+        Syntax:  *atomic.NewInt64(100),
+        Charset: *atomic.NewInt64(100),
+        Type:    *atomic.NewInt64(100),
+    }
+    cfg.Conflict.Threshold = 100
+
+    em := &ErrorManager{
+        configError:       &cfg.App.MaxError,
+        remainingError:    cfg.App.MaxError,
+        configConflict:    &cfg.Conflict,
+        conflictErrRemain: atomic.NewInt64(100),
+        schema:            "error_info",
+        conflictV1Enabled: true,
+    }
+
+    output := em.Output()
+    require.Equal(t, output, "")
+
+    em.remainingError.Syntax.Sub(1)
+    output = em.Output()
+    expected := "\n" +
+        "Import Data Error Summary: \n" +
+        "+---+-------------+-------------+--------------------------------+\n" +
+        "| # | ERROR TYPE  | ERROR COUNT | ERROR DATA TABLE               |\n" +
+        "+---+-------------+-------------+--------------------------------+\n" +
+        "|\x1b[31m 1 \x1b[0m|\x1b[31m Data Syntax \x1b[0m|\x1b[31m           1 \x1b[0m|\x1b[31m `error_info`.`syntax_error_v2` \x1b[0m|\n" +
+        "+---+-------------+-------------+--------------------------------+\n"
+    require.Equal(t, expected, output)
+
+    em.remainingError = cfg.App.MaxError
+    em.remainingError.Syntax.Sub(10)
+    em.remainingError.Type.Store(10)
+    output = em.Output()
+    expected = "\n" +
+        "Import Data Error Summary: \n" +
+        "+---+-------------+-------------+--------------------------------+\n" +
+        "| # | ERROR TYPE  | ERROR COUNT | ERROR DATA TABLE               |\n" +
+        "+---+-------------+-------------+--------------------------------+\n" +
+        "|\x1b[31m 1 \x1b[0m|\x1b[31m Data Type   \x1b[0m|\x1b[31m          90 \x1b[0m|\x1b[31m `error_info`.`type_error_v2`   \x1b[0m|\n" +
+        "|\x1b[31m 2 \x1b[0m|\x1b[31m Data Syntax \x1b[0m|\x1b[31m          10 \x1b[0m|\x1b[31m `error_info`.`syntax_error_v2` \x1b[0m|\n" +
+        "+---+-------------+-------------+--------------------------------+\n"
+    require.Equal(t, expected, output)
+
+    // change multiple keys
+    em.remainingError = cfg.App.MaxError
+    em.remainingError.Syntax.Store(0)
+    em.remainingError.Charset.Store(0)
+    em.remainingError.Type.Store(0)
+    em.conflictErrRemain.Store(0)
+    output = em.Output()
+    expected = "\n" +
+        "Import Data Error Summary: \n" +
+        "+---+---------------------+-------------+--------------------------------+\n" +
+        "| # | ERROR TYPE          | ERROR COUNT | ERROR DATA TABLE               |\n" +
+        "+---+---------------------+-------------+--------------------------------+\n" +
+        "|\x1b[31m 1 \x1b[0m|\x1b[31m Data Type           \x1b[0m|\x1b[31m         100 \x1b[0m|\x1b[31m `error_info`.`type_error_v2`   \x1b[0m|\n" +
+        "|\x1b[31m 2 \x1b[0m|\x1b[31m Data Syntax         \x1b[0m|\x1b[31m         100 \x1b[0m|\x1b[31m `error_info`.`syntax_error_v2` \x1b[0m|\n" +
+        "|\x1b[31m 3 \x1b[0m|\x1b[31m Charset Error       \x1b[0m|\x1b[31m         100 \x1b[0m|\x1b[31m                                \x1b[0m|\n" +
+        "|\x1b[31m 4 \x1b[0m|\x1b[31m Unique Key Conflict \x1b[0m|\x1b[31m         100 \x1b[0m|\x1b[31m `error_info`.`conflict_view`   \x1b[0m|\n" +
+        "+---+---------------------+-------------+--------------------------------+\n"
+    require.Equal(t, expected, output)
+
+    em.conflictV2Enabled = true
+    em.conflictV1Enabled = false
+    output = em.Output()
+    expected = "\n" +
+        "Import Data Error Summary: \n" +
Summary: \n" + + "+---+---------------------+-------------+--------------------------------+\n" + + "| # | ERROR TYPE | ERROR COUNT | ERROR DATA TABLE |\n" + + "+---+---------------------+-------------+--------------------------------+\n" + + "|\x1b[31m 1 \x1b[0m|\x1b[31m Data Type \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `error_info`.`type_error_v2` \x1b[0m|\n" + + "|\x1b[31m 2 \x1b[0m|\x1b[31m Data Syntax \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `error_info`.`syntax_error_v2` \x1b[0m|\n" + + "|\x1b[31m 3 \x1b[0m|\x1b[31m Charset Error \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m \x1b[0m|\n" + + "|\x1b[31m 4 \x1b[0m|\x1b[31m Unique Key Conflict \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `error_info`.`conflict_view` \x1b[0m|\n" + + "+---+---------------------+-------------+--------------------------------+\n" + require.Equal(t, expected, output) + + em.conflictV2Enabled = true + em.conflictV1Enabled = true + output = em.Output() + expected = "\n" + + "Import Data Error Summary: \n" + + "+---+---------------------+-------------+--------------------------------+\n" + + "| # | ERROR TYPE | ERROR COUNT | ERROR DATA TABLE |\n" + + "+---+---------------------+-------------+--------------------------------+\n" + + "|\x1b[31m 1 \x1b[0m|\x1b[31m Data Type \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `error_info`.`type_error_v2` \x1b[0m|\n" + + "|\x1b[31m 2 \x1b[0m|\x1b[31m Data Syntax \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `error_info`.`syntax_error_v2` \x1b[0m|\n" + + "|\x1b[31m 3 \x1b[0m|\x1b[31m Charset Error \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m \x1b[0m|\n" + + "|\x1b[31m 4 \x1b[0m|\x1b[31m Unique Key Conflict \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `error_info`.`conflict_view` \x1b[0m|\n" + + "+---+---------------------+-------------+--------------------------------+\n" + require.Equal(t, expected, output) + + em.schema = "long_long_long_long_long_long_long_long_dbname" + output = em.Output() + expected = "\n" + + "Import Data Error Summary: \n" + + "+---+---------------------+-------------+--------------------------------------------------------------------+\n" + + "| # | ERROR TYPE | ERROR COUNT | ERROR DATA TABLE |\n" + + "+---+---------------------+-------------+--------------------------------------------------------------------+\n" + + "|\x1b[31m 1 \x1b[0m|\x1b[31m Data Type \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `long_long_long_long_long_long_long_long_dbname`.`type_error_v2` \x1b[0m|\n" + + "|\x1b[31m 2 \x1b[0m|\x1b[31m Data Syntax \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `long_long_long_long_long_long_long_long_dbname`.`syntax_error_v2` \x1b[0m|\n" + + "|\x1b[31m 3 \x1b[0m|\x1b[31m Charset Error \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m \x1b[0m|\n" + + "|\x1b[31m 4 \x1b[0m|\x1b[31m Unique Key Conflict \x1b[0m|\x1b[31m 100 \x1b[0m|\x1b[31m `long_long_long_long_long_long_long_long_dbname`.`conflict_view` \x1b[0m|\n" + + "+---+---------------------+-------------+--------------------------------------------------------------------+\n" + require.Equal(t, expected, output) +}