Skip to content

Commit

Permalink
diff: add config to only use checksum, skip select data (pingcap#215)
Browse files Browse the repository at this point in the history
  • Loading branch information
WangXiangUSTC committed Apr 9, 2019
1 parent 64d87c4 commit 7df5696
Show file tree
Hide file tree
Showing 4 changed files with 31 additions and 1 deletion.
8 changes: 8 additions & 0 deletions pkg/diff/diff.go
Original file line number Diff line number Diff line change
Expand Up @@ -74,6 +74,9 @@ type TableDiff struct {
// set false if want to comapre the data directly
UseChecksum bool

// set true if just want compare data by checksum, will skip select data when checksum is not equal
OnlyUseChecksum bool

// collation config in mysql/tidb, should corresponding to charset.
Collation string

Expand Down Expand Up @@ -284,6 +287,11 @@ func (t *TableDiff) checkChunkDataEqual(ctx context.Context, checkJobs []*CheckJ
log.Warnf("table: %s, range: %s, args: %v, checksum is not equal, one is %d, another is %d", dbutil.TableName(job.Schema, job.Table), job.Where, job.Args, sourceChecksum, targetChecksum)
}

if t.UseChecksum && t.OnlyUseChecksum {
equal = false
continue
}

// if checksum is not equal or don't need compare checksum, compare the data
log.Infof("select data from %s for range (where: %s, args: %v) and then check data", dbutil.TableName(job.Schema, job.Table), job.Where, job.Args)
sourceRows := make(map[string][]map[string]*dbutil.ColumnData)
Expand Down
15 changes: 15 additions & 0 deletions sync_diff_inspector/config.go
Original file line number Diff line number Diff line change
Expand Up @@ -180,6 +180,9 @@ type Config struct {
// set false if want to comapre the data directly
UseChecksum bool `toml:"use-checksum" json:"use-checksum"`

// set true if just want compare data by checksum, will skip select data when checksum is not equal.
OnlyUseChecksum bool `toml:"only-use-checksum" json:"only-use-checksum"`

// the name of the file which saves sqls used to fix different data
FixSQLFile string `toml:"fix-sql-file" json:"fix-sql-file"`

Expand Down Expand Up @@ -312,5 +315,17 @@ func (c *Config) checkConfig() bool {
}
}

if c.OnlyUseChecksum {
if !c.UseChecksum {
log.Error("need set use-checksum = true")
return false
}
} else {
if len(c.FixSQLFile) == 0 {
log.Warn("fix-sql-file is invalid, will use default value 'fix.sql'")
c.FixSQLFile = "fix.sql"
}
}

return true
}
6 changes: 5 additions & 1 deletion sync_diff_inspector/config.toml
Original file line number Diff line number Diff line change
Expand Up @@ -18,15 +18,19 @@ sample-percent = 100
use-rowid = false

# calculate the data's checksum, and compare data by checksum.
# set false if want to comapre the data directly
use-checksum = true

# set true if just want compare data by checksum, will skip select data when checksum is not equal.
only-use-checksum = false

# ignore check table's data
ignore-data-check = false

# ignore check table's struct
ignore-struct-check = false

# the name of the file which saves sqls used to fix different data
# the name of the file which saves sqls used to fix different data.
fix-sql-file = "fix.sql"

# use this tidb's statistics information to split chunk
Expand Down
3 changes: 3 additions & 0 deletions sync_diff_inspector/diff.go
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,7 @@ type Diff struct {
checkThreadCount int
useRowID bool
useChecksum bool
onlyUseChecksum bool
ignoreDataCheck bool
ignoreStructCheck bool
tables map[string]map[string]*TableConfig
Expand All @@ -56,6 +57,7 @@ func NewDiff(ctx context.Context, cfg *Config) (diff *Diff, err error) {
checkThreadCount: cfg.CheckThreadCount,
useRowID: cfg.UseRowID,
useChecksum: cfg.UseChecksum,
onlyUseChecksum: cfg.OnlyUseChecksum,
ignoreDataCheck: cfg.IgnoreDataCheck,
ignoreStructCheck: cfg.IgnoreStructCheck,
tidbInstanceID: cfg.TiDBInstanceID,
Expand Down Expand Up @@ -404,6 +406,7 @@ func (df *Diff) Equal() (err error) {
CheckThreadCount: df.checkThreadCount,
UseRowID: df.useRowID,
UseChecksum: df.useChecksum,
OnlyUseChecksum: df.onlyUseChecksum,
IgnoreStructCheck: df.ignoreStructCheck,
IgnoreDataCheck: df.ignoreDataCheck,
TiDBStatsSource: tidbStatsSource,
Expand Down

0 comments on commit 7df5696

Please sign in to comment.