Skip to content

Commit

Permalink
planner: fix RANGE COLUMNS partition prune gives wrong result with sp…
Browse files Browse the repository at this point in the history
…ecial collation (#57344) (#57407)

close #57261
  • Loading branch information
ti-chi-bot authored Nov 15, 2024
1 parent 6e6a012 commit 9112d43
Show file tree
Hide file tree
Showing 3 changed files with 65 additions and 17 deletions.
54 changes: 54 additions & 0 deletions pkg/planner/core/partition_pruning_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -575,6 +575,60 @@ func TestPartitionRangeColumnsForExpr(t *testing.T) {
}
}

func TestPartitionRangeColumnsForExprWithSpecialCollation(t *testing.T) {
tc := prepareTestCtx(t, "create table t (a varchar(255) COLLATE utf8mb4_0900_ai_ci, b varchar(255) COLLATE utf8mb4_unicode_ci)", "a,b")
lessThan := make([][]*expression.Expression, 0, 6)
partDefs := [][]string{
{"'i'", "'i'"},
{"MAXVALUE", "MAXVALUE"},
}
for i := range partDefs {
l := make([]*expression.Expression, 0, 2)
for j := range []int{0, 1} {
v := partDefs[i][j]
var e *expression.Expression
if v == "MAXVALUE" {
e = nil // MAXVALUE
} else {
expr, err := expression.ParseSimpleExpr(tc.sctx, v, expression.WithInputSchemaAndNames(tc.schema, tc.names, nil))
require.NoError(t, err)
e = &expr
}
l = append(l, e)
}
lessThan = append(lessThan, l)
}
pruner := &rangeColumnsPruner{lessThan, tc.columns[:2]}
cases := []struct {
input string
result partitionRangeOR
}{
{"a = 'q'", partitionRangeOR{{1, 2}}},
{"a = 'Q'", partitionRangeOR{{1, 2}}},
{"a = 'a'", partitionRangeOR{{0, 1}}},
{"a = 'A'", partitionRangeOR{{0, 1}}},
{"a > 'a'", partitionRangeOR{{0, 2}}},
{"a > 'q'", partitionRangeOR{{1, 2}}},
{"a = 'i' and b = 'q'", partitionRangeOR{{1, 2}}},
{"a = 'i' and b = 'Q'", partitionRangeOR{{1, 2}}},
{"a = 'i' and b = 'a'", partitionRangeOR{{0, 1}}},
{"a = 'i' and b = 'A'", partitionRangeOR{{0, 1}}},
{"a = 'i' and b > 'a'", partitionRangeOR{{0, 2}}},
{"a = 'i' and b > 'q'", partitionRangeOR{{1, 2}}},
{"a = 'i' or a = 'h'", partitionRangeOR{{0, 2}}},
{"a = 'h' and a = 'j'", partitionRangeOR{}},
}

for _, ca := range cases {
expr, err := expression.ParseSimpleExpr(tc.sctx, ca.input, expression.WithInputSchemaAndNames(tc.schema, tc.names, nil))
require.NoError(t, err)
result := fullRange(len(lessThan))
e := expression.SplitCNFItems(expr)
result = partitionRangeForCNFExpr(tc.sctx, e, pruner, result)
require.Truef(t, equalPartitionRangeOR(ca.result, result), "unexpected: %v %v != %v", ca.input, ca.result, result)
}
}

func benchmarkRangeColumnsPruner(b *testing.B, parts int) {
tc := prepareBenchCtx("create table t (a bigint unsigned, b int, c int)", "a")
if tc == nil {
Expand Down
13 changes: 4 additions & 9 deletions pkg/planner/core/rule_partition_processor.go
Original file line number Diff line number Diff line change
Expand Up @@ -1320,7 +1320,7 @@ func multiColumnRangeColumnsPruner(sctx base.PlanContext, exprs []expression.Exp
lens = append(lens, columnsPruner.partCols[i].RetType.GetFlen())
}

res, err := ranger.DetachCondAndBuildRangeForIndex(sctx.GetRangerCtx(), exprs, columnsPruner.partCols, lens, sctx.GetSessionVars().RangeMaxSize)
res, err := ranger.DetachCondAndBuildRangeForPartition(sctx.GetRangerCtx(), exprs, columnsPruner.partCols, lens, sctx.GetSessionVars().RangeMaxSize)
if err != nil {
return fullRange(len(columnsPruner.lessThan))
}
Expand All @@ -1335,16 +1335,12 @@ func multiColumnRangeColumnsPruner(sctx base.PlanContext, exprs []expression.Exp

rangeOr := make([]partitionRange, 0, len(res.Ranges))

comparer := make([]collate.Collator, 0, len(columnsPruner.partCols))
for i := range columnsPruner.partCols {
comparer = append(comparer, collate.GetCollator(columnsPruner.partCols[i].RetType.GetCollate()))
}
gotError := false
// Create a sort.Search where the compare loops over ColumnValues
// Loop over the different ranges and extend/include all the partitions found
for idx := range res.Ranges {
minComparer := minCmp(sctx, res.Ranges[idx].LowVal, columnsPruner, comparer, res.Ranges[idx].LowExclude, &gotError)
maxComparer := maxCmp(sctx, res.Ranges[idx].HighVal, columnsPruner, comparer, res.Ranges[idx].HighExclude, &gotError)
minComparer := minCmp(sctx, res.Ranges[idx].LowVal, columnsPruner, res.Ranges[idx].Collators, res.Ranges[idx].LowExclude, &gotError)
maxComparer := maxCmp(sctx, res.Ranges[idx].HighVal, columnsPruner, res.Ranges[idx].Collators, res.Ranges[idx].HighExclude, &gotError)
if gotError {
// the compare function returned error, use all partitions.
return fullRange(len(columnsPruner.lessThan))
Expand Down Expand Up @@ -1953,10 +1949,9 @@ func makeRangeColumnPruner(columns []*expression.Column, pi *model.PartitionInfo
if len(pi.Definitions) != len(from.LessThan) {
return nil, errors.Trace(fmt.Errorf("internal error len(pi.Definitions) != len(from.LessThan) %d != %d", len(pi.Definitions), len(from.LessThan)))
}
schema := expression.NewSchema(columns...)
partCols := make([]*expression.Column, len(offsets))
for i, offset := range offsets {
partCols[i] = schema.Columns[offset]
partCols[i] = columns[offset]
}
lessThan := make([][]*expression.Expression, 0, len(from.LessThan))
for i := range from.LessThan {
Expand Down
15 changes: 7 additions & 8 deletions pkg/util/ranger/detacher.go
Original file line number Diff line number Diff line change
Expand Up @@ -323,7 +323,7 @@ func extractBestCNFItemRanges(sctx *rangerctx.RangerContext, conds []expression.
// We build ranges for `(a,b) in ((1,1),(1,2))` and get `[1 1, 1 1] [1 2, 1 2]`, which are point ranges and we can
// append `c = 1` to the point ranges. However, if we choose to merge consecutive ranges here, we get `[1 1, 1 2]`,
// which are not point ranges, and we cannot append `c = 1` anymore.
res, err := detachCondAndBuildRangeWithoutMerging(sctx, tmpConds, cols, lengths, rangeMaxSize, convertToSortKey)
res, err := detachCondAndBuildRange(sctx, tmpConds, cols, lengths, rangeMaxSize, convertToSortKey, false)
if err != nil {
return nil, nil, err
}
Expand Down Expand Up @@ -479,7 +479,7 @@ func (d *rangeDetacher) detachCNFCondAndBuildRangeForIndex(conditions []expressi
if eqOrInCount > 0 {
newCols := d.cols[eqOrInCount:]
newLengths := d.lengths[eqOrInCount:]
tailRes, err := DetachCondAndBuildRangeForIndex(d.sctx, newConditions, newCols, newLengths, d.rangeMaxSize)
tailRes, err := detachCondAndBuildRange(d.sctx, newConditions, newCols, newLengths, d.rangeMaxSize, d.convertToSortKey, d.mergeConsecutive)
if err != nil {
return nil, err
}
Expand Down Expand Up @@ -1004,16 +1004,15 @@ func DetachCondAndBuildRangeForIndex(sctx *rangerctx.RangerContext, conditions [
return d.detachCondAndBuildRangeForCols()
}

// detachCondAndBuildRangeWithoutMerging detaches the index filters from table filters and uses them to build ranges.
// When building ranges, it doesn't merge consecutive ranges.
func detachCondAndBuildRangeWithoutMerging(sctx *rangerctx.RangerContext, conditions []expression.Expression, cols []*expression.Column,
lengths []int, rangeMaxSize int64, convertToSortKey bool) (*DetachRangeResult, error) {
// detachCondAndBuildRange detaches the index filters from table filters and uses them to build ranges.
func detachCondAndBuildRange(sctx *rangerctx.RangerContext, conditions []expression.Expression, cols []*expression.Column,
lengths []int, rangeMaxSize int64, convertToSortKey bool, mergeConsecutive bool) (*DetachRangeResult, error) {
d := &rangeDetacher{
sctx: sctx,
allConds: conditions,
cols: cols,
lengths: lengths,
mergeConsecutive: false,
mergeConsecutive: mergeConsecutive,
convertToSortKey: convertToSortKey,
rangeMaxSize: rangeMaxSize,
}
Expand All @@ -1026,7 +1025,7 @@ func detachCondAndBuildRangeWithoutMerging(sctx *rangerctx.RangerContext, condit
// The returned values are encapsulated into a struct DetachRangeResult, see its comments for explanation.
func DetachCondAndBuildRangeForPartition(sctx *rangerctx.RangerContext, conditions []expression.Expression, cols []*expression.Column,
lengths []int, rangeMaxSize int64) (*DetachRangeResult, error) {
return detachCondAndBuildRangeWithoutMerging(sctx, conditions, cols, lengths, rangeMaxSize, false)
return detachCondAndBuildRange(sctx, conditions, cols, lengths, rangeMaxSize, false, false)
}

type rangeDetacher struct {
Expand Down

0 comments on commit 9112d43

Please # to comment.