Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

release-22.2: colbuilder: fix aggregation with no aggregate funcs #87682

Merged
merged 1 commit into from
Sep 12, 2022
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
25 changes: 0 additions & 25 deletions pkg/sql/colexec/colbuilder/execplan.go
Original file line number Diff line number Diff line change
Expand Up @@ -804,31 +804,6 @@ func NewColOperator(
return r, err
}
aggSpec := core.Aggregator
if len(aggSpec.Aggregations) == 0 {
// We can get an aggregator when no aggregate functions are
// present if HAVING clause is present, for example, with a
// query as follows: SELECT 1 FROM t HAVING true. In this case,
// we plan a special operator that outputs a batch of length 1
// or 0 (depending on whether the aggregate is in scalar context
// or not) without actual columns once and then zero-length
// batches. The actual "data" will be added by projections
// below.
// TODO(solon): The distsql plan for this case includes a
// TableReader, so we end up creating an orphaned colBatchScan.
// We should avoid that. Ideally the optimizer would not plan a
// scan in this unusual case.
numTuples := 0
if aggSpec.IsScalar() {
numTuples = 1
}
result.Root, err = colexecutils.NewFixedNumTuplesNoInputOp(
getStreamingAllocator(ctx, args), numTuples, inputs[0].Root,
), nil
// We make ColumnTypes non-nil so that sanity check doesn't
// panic.
result.ColumnTypes = []*types.T{}
break
}
if aggSpec.IsRowCount() {
result.Root, err = colexec.NewCountOp(getStreamingAllocator(ctx, args), inputs[0].Root), nil
result.ColumnTypes = []*types.T{types.Int}
Expand Down
15 changes: 13 additions & 2 deletions pkg/sql/colexec/colexecbase/distinct.go
Original file line number Diff line number Diff line change
Expand Up @@ -35,8 +35,19 @@ func OrderedDistinctColsToOperators(
OneInputHelper: colexecop.MakeOneInputHelper(input),
fn: func() { copy(distinctCol, colexecutils.ZeroBoolColumn) },
}
for i := range distinctCols {
input = newSingleDistinct(input, int(distinctCols[i]), distinctCol, typs[distinctCols[i]], nullsAreDistinct)
if len(distinctCols) > 0 {
for i := range distinctCols {
input = newSingleDistinct(input, int(distinctCols[i]), distinctCol, typs[distinctCols[i]], nullsAreDistinct)
}
} else {
// If there are no distinct columns, we have to mark the very first
// tuple as distinct ourselves.
firstTuple := true
input.(*fnOp).fn = func() {
copy(distinctCol, colexecutils.ZeroBoolColumn)
distinctCol[0] = firstTuple
firstTuple = false
}
}
r, ok := input.(colexecop.ResettableOperator)
if !ok {
Expand Down
13 changes: 12 additions & 1 deletion pkg/sql/colexec/ordered_aggregator.go
Original file line number Diff line number Diff line change
Expand Up @@ -255,7 +255,18 @@ func (a *orderedAggregator) Next() coldata.Batch {
}
})
}
a.scratch.resumeIdx = a.bucket.fns[0].CurrentOutputIndex()
if len(a.bucket.fns) > 0 {
a.scratch.resumeIdx = a.bucket.fns[0].CurrentOutputIndex()
} else {
// When there are no aggregate functions to compute, we
// simply need to output the same number of empty rows as
// the number of groups.
for _, newGroup := range a.groupCol[:batchLength] {
if newGroup {
a.scratch.resumeIdx++
}
}
}
}
if batchLength == 0 {
a.state = orderedAggregatorOutputting
Expand Down
16 changes: 16 additions & 0 deletions pkg/sql/logictest/testdata/logic_test/vectorize_agg
Original file line number Diff line number Diff line change
Expand Up @@ -55,3 +55,19 @@ NULL NULL
1 1
22 22
33 33

# Regression test for incorrect handling of non-scalar GROUP BY with no
# aggregate functions (#87619).
statement ok
CREATE TABLE t87619 (b) AS SELECT true;
SET testing_optimizer_random_seed = 3164997759865821235;
SET testing_optimizer_disable_rule_probability = 0.500000;

query B
SELECT true FROM t87619 GROUP BY b HAVING b
----
true

statement ok
RESET testing_optimizer_random_seed;
RESET testing_optimizer_disable_rule_probability;