-
Notifications
You must be signed in to change notification settings - Fork 1.3k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
optimize queries where lhs and rhs of predicate are equal (#10444)
- Loading branch information
Showing
8 changed files
with
377 additions
and
162 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
129 changes: 129 additions & 0 deletions
129
...in/java/org/apache/pinot/core/query/optimizer/filter/BaseAndOrBooleanFilterOptimizer.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,129 @@ | ||
/** | ||
* Licensed to the Apache Software Foundation (ASF) under one | ||
* or more contributor license agreements. See the NOTICE file | ||
* distributed with this work for additional information | ||
* regarding copyright ownership. The ASF licenses this file | ||
* to you under the Apache License, Version 2.0 (the | ||
* "License"); you may not use this file except in compliance | ||
* with the License. You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the License is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
* KIND, either express or implied. See the License for the | ||
* specific language governing permissions and limitations | ||
* under the License. | ||
*/ | ||
package org.apache.pinot.core.query.optimizer.filter; | ||
|
||
import java.util.List; | ||
import javax.annotation.Nullable; | ||
import org.apache.pinot.common.request.Expression; | ||
import org.apache.pinot.common.request.Function; | ||
import org.apache.pinot.common.utils.request.RequestUtils; | ||
import org.apache.pinot.spi.data.Schema; | ||
import org.apache.pinot.sql.FilterKind; | ||
|
||
|
||
/** | ||
* This base class acts as a helper for any optimizer that is effectively removing filter conditions. | ||
* It provides TRUE/FALSE literal classes that can be used to replace filter expressions that are always true/false. | ||
* It provides an optimization implementation for AND/OR/NOT expressions. | ||
*/ | ||
public abstract class BaseAndOrBooleanFilterOptimizer implements FilterOptimizer { | ||
|
||
protected static final Expression TRUE = RequestUtils.getLiteralExpression(true); | ||
protected static final Expression FALSE = RequestUtils.getLiteralExpression(false); | ||
|
||
/** | ||
* This recursively optimizes each part of the filter expression. For any AND/OR/NOT, | ||
* we optimize each child, then we optimize the remaining statement. If there is only | ||
* a child statement, we optimize that. | ||
*/ | ||
@Override | ||
public Expression optimize(Expression filterExpression, @Nullable Schema schema) { | ||
if (!canBeOptimized(filterExpression, schema)) { | ||
return filterExpression; | ||
} | ||
|
||
Function function = filterExpression.getFunctionCall(); | ||
List<Expression> operands = function.getOperands(); | ||
FilterKind kind = FilterKind.valueOf(function.getOperator()); | ||
switch (kind) { | ||
case AND: | ||
case OR: | ||
case NOT: | ||
// Recursively traverse the expression tree to find an operator node that can be rewritten. | ||
operands.replaceAll(operand -> optimize(operand, schema)); | ||
|
||
// We have rewritten the child operands, so rewrite the parent if needed. | ||
return optimizeCurrent(filterExpression); | ||
default: | ||
return optimizeChild(filterExpression, schema); | ||
} | ||
} | ||
|
||
abstract boolean canBeOptimized(Expression filterExpression, @Nullable Schema schema); | ||
|
||
/** | ||
* Optimize any cases that are not AND/OR/NOT. This should be done by converting any cases | ||
* that are always true to TRUE or always false to FALSE. | ||
*/ | ||
abstract Expression optimizeChild(Expression filterExpression, @Nullable Schema schema); | ||
|
||
/** | ||
* If any of the operands of AND function is "false", then the AND function itself is false and can be replaced with | ||
* "false" literal. Otherwise, remove all the "true" operands of the AND function. Similarly, if any of the operands | ||
* of OR function is "true", then the OR function itself is true and can be replaced with "true" literal. Otherwise, | ||
* remove all the "false" operands of the OR function. | ||
*/ | ||
protected Expression optimizeCurrent(Expression expression) { | ||
Function function = expression.getFunctionCall(); | ||
String operator = function.getOperator(); | ||
List<Expression> operands = function.getOperands(); | ||
if (operator.equals(FilterKind.AND.name())) { | ||
// If any of the literal operands are always false, then replace AND function with FALSE. | ||
for (Expression operand : operands) { | ||
if (operand.equals(FALSE)) { | ||
return FALSE; | ||
} | ||
} | ||
|
||
// Remove all Literal operands that are always true. | ||
operands.removeIf(operand -> operand.equals(TRUE)); | ||
if (operands.isEmpty()) { | ||
return TRUE; | ||
} | ||
} else if (operator.equals(FilterKind.OR.name())) { | ||
// If any of the literal operands are always true, then replace OR function with TRUE | ||
for (Expression operand : operands) { | ||
if (operand.equals(TRUE)) { | ||
return TRUE; | ||
} | ||
} | ||
|
||
// Remove all Literal operands that are always false. | ||
operands.removeIf(operand -> operand.equals(FALSE)); | ||
if (operands.isEmpty()) { | ||
return FALSE; | ||
} | ||
} else if (operator.equals(FilterKind.NOT.name())) { | ||
assert operands.size() == 1; | ||
Expression operand = operands.get(0); | ||
if (operand.equals(TRUE)) { | ||
return FALSE; | ||
} | ||
if (operand.equals(FALSE)) { | ||
return TRUE; | ||
} | ||
} | ||
return expression; | ||
} | ||
|
||
/** Change the expression value to boolean literal with given value. */ | ||
protected static Expression getExpressionFromBoolean(boolean value) { | ||
return value ? TRUE : FALSE; | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
106 changes: 106 additions & 0 deletions
106
.../java/org/apache/pinot/core/query/optimizer/filter/IdenticalPredicateFilterOptimizer.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,106 @@ | ||
/** | ||
* Licensed to the Apache Software Foundation (ASF) under one | ||
* or more contributor license agreements. See the NOTICE file | ||
* distributed with this work for additional information | ||
* regarding copyright ownership. The ASF licenses this file | ||
* to you under the Apache License, Version 2.0 (the | ||
* "License"); you may not use this file except in compliance | ||
* with the License. You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the License is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
* KIND, either express or implied. See the License for the | ||
* specific language governing permissions and limitations | ||
* under the License. | ||
*/ | ||
package org.apache.pinot.core.query.optimizer.filter; | ||
|
||
import java.util.List; | ||
import javax.annotation.Nullable; | ||
import org.apache.pinot.common.request.Expression; | ||
import org.apache.pinot.common.request.Function; | ||
import org.apache.pinot.spi.data.Schema; | ||
import org.apache.pinot.sql.FilterKind; | ||
|
||
|
||
/** | ||
* This optimizer converts all predicates where the left hand side == right hand side to | ||
* a simple TRUE/FALSE literal value. While filters like, WHERE 1=1 OR "col1"="col1" are not | ||
* typical, they end up expensive in Pinot because they are rewritten as A-A==0. | ||
*/ | ||
public class IdenticalPredicateFilterOptimizer extends BaseAndOrBooleanFilterOptimizer { | ||
|
||
@Override | ||
boolean canBeOptimized(Expression filterExpression, @Nullable Schema schema) { | ||
// if there's no function call, there's no lhs or rhs | ||
return filterExpression.getFunctionCall() != null; | ||
} | ||
|
||
@Override | ||
Expression optimizeChild(Expression filterExpression, @Nullable Schema schema) { | ||
Function function = filterExpression.getFunctionCall(); | ||
FilterKind kind = FilterKind.valueOf(function.getOperator()); | ||
switch (kind) { | ||
case EQUALS: | ||
if (hasIdenticalLhsAndRhs(function.getOperands())) { | ||
return TRUE; | ||
} | ||
break; | ||
case NOT_EQUALS: | ||
if (hasIdenticalLhsAndRhs(function.getOperands())) { | ||
return FALSE; | ||
} | ||
break; | ||
default: | ||
break; | ||
} | ||
return filterExpression; | ||
} | ||
|
||
/** | ||
* Pinot queries of the WHERE 1 != 1 AND "col1" = "col2" variety are rewritten as | ||
* 1-1 != 0 AND "col1"-"col2" = 0. Therefore, we check specifically for the case where | ||
* the operand is set up in this fashion. | ||
* | ||
* We return false specifically after every check to ensure we're only continuing when | ||
* the input looks as expected. Otherwise, it's easy to for one of the operand functions | ||
* to return null and fail the query. | ||
* | ||
* TODO: The rewrite is already happening in PredicateComparisonRewriter.updateFunctionExpression(), | ||
* so we might just compare the lhs and rhs there. | ||
*/ | ||
private boolean hasIdenticalLhsAndRhs(List<Expression> operands) { | ||
boolean hasTwoChildren = operands.size() == 2; | ||
Expression firstChild = operands.get(0); | ||
if (firstChild.getFunctionCall() == null || !hasTwoChildren) { | ||
return false; | ||
} | ||
boolean firstChildIsMinusOperator = firstChild.getFunctionCall().getOperator().equals("minus"); | ||
if (!firstChildIsMinusOperator) { | ||
return false; | ||
} | ||
boolean firstChildHasTwoOperands = firstChild.getFunctionCall().getOperandsSize() == 2; | ||
if (!firstChildHasTwoOperands) { | ||
return false; | ||
} | ||
Expression minusOperandFirstChild = firstChild.getFunctionCall().getOperands().get(0); | ||
Expression minusOperandSecondChild = firstChild.getFunctionCall().getOperands().get(1); | ||
if (minusOperandFirstChild == null || minusOperandSecondChild == null || !minusOperandFirstChild.equals( | ||
minusOperandSecondChild)) { | ||
return false; | ||
} | ||
Expression secondChild = operands.get(1); | ||
return isLiteralZero(secondChild); | ||
} | ||
|
||
private boolean isLiteralZero(Expression expression) { | ||
if (!expression.isSetLiteral()) { | ||
return false; | ||
} | ||
Object literalValue = expression.getLiteral().getFieldValue(); | ||
return literalValue.equals(0) || literalValue.equals(0L) || literalValue.equals(0d); | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.