From 2cd8d46158360f6a120f8834131e1456a02cd38d Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Fri, 18 Nov 2022 17:41:44 -0800 Subject: [PATCH 01/16] Add new table scan builder and optimizer rules Signed-off-by: Chen Dai --- .../sql/planner/DefaultImplementor.java | 6 + .../logical/LogicalPlanNodeVisitor.java | 6 + .../optimizer/LogicalPlanOptimizer.java | 23 +- .../planner/optimizer/pattern/Patterns.java | 77 +++ .../rule/scan/CreateTableScanBuilder.java | 47 ++ .../rule/scan/TableScanPushDown.java | 119 ++++ .../org/opensearch/sql/storage/Table.java | 12 + .../sql/storage/TableScanBuilder.java | 64 ++ .../sql/planner/DefaultImplementorTest.java | 15 + .../logical/LogicalPlanNodeVisitorTest.java | 11 + .../optimizer/LogicalPlanOptimizerTest.java | 170 ++++- .../optimizer/pattern/PatternsTest.java | 9 + .../logical/OpenSearchLogicalIndexAgg.java | 80 --- .../logical/OpenSearchLogicalIndexScan.java | 97 --- ...OpenSearchLogicalPlanOptimizerFactory.java | 47 -- .../logical/rule/MergeAggAndIndexScan.java | 57 -- .../logical/rule/MergeAggAndRelation.java | 54 -- .../logical/rule/MergeFilterAndRelation.java | 53 -- .../logical/rule/MergeLimitAndIndexScan.java | 54 -- .../logical/rule/MergeLimitAndRelation.java | 49 -- .../logical/rule/MergeSortAndIndexAgg.java | 82 --- .../logical/rule/MergeSortAndIndexScan.java | 70 --- .../logical/rule/MergeSortAndRelation.java | 53 -- .../logical/rule/OptimizationRuleUtils.java | 66 -- .../logical/rule/PushProjectAndIndexScan.java | 63 -- .../logical/rule/PushProjectAndRelation.java | 67 -- .../agg/CompositeAggregationParser.java | 2 + .../opensearch/response/agg/FilterParser.java | 2 + .../response/agg/MetricParserHelper.java | 2 + .../response/agg/SingleValueParser.java | 2 + .../opensearch/response/agg/StatsParser.java | 2 + .../response/agg/TopHitsParser.java | 2 + .../opensearch/storage/OpenSearchIndex.java | 107 +--- .../OpenSearchAggregateIndexScanBuilder.java | 98 +++ .../scan/OpenSearchIndexScanBuilder.java | 87 +++ .../OpenSearchSimpleIndexScanBuilder.java | 133 ++++ .../logical/OpenSearchLogicOptimizerTest.java | 576 ----------------- .../OpenSearchLogicalIndexScanTest.java | 24 - .../OpenSearchDefaultImplementorTest.java | 36 +- .../storage/OpenSearchIndexTest.java | 232 +------ .../OpenSearchIndexScanOptimizationTest.java | 584 ++++++++++++++++++ .../sql/opensearch/utils/Utils.java | 131 ---- 42 files changed, 1484 insertions(+), 1987 deletions(-) create mode 100644 core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java create mode 100644 core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java create mode 100644 core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexAgg.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScan.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalPlanOptimizerFactory.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndIndexScan.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndRelation.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeFilterAndRelation.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndIndexScan.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndRelation.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexAgg.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexScan.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndRelation.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/OptimizationRuleUtils.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndIndexScan.java delete mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndRelation.java create mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java create mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java create mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java delete mode 100644 opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicOptimizerTest.java delete mode 100644 opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScanTest.java create mode 100644 opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java diff --git a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java index 9f2c2c5fa8..db9b0e8fae 100644 --- a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java +++ b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java @@ -34,6 +34,7 @@ import org.opensearch.sql.planner.physical.SortOperator; import org.opensearch.sql.planner.physical.ValuesOperator; import org.opensearch.sql.planner.physical.WindowOperator; +import org.opensearch.sql.storage.TableScanBuilder; /** * Default implementor for implementing logical to physical translation. "Default" here means all @@ -123,6 +124,11 @@ public PhysicalPlan visitLimit(LogicalLimit node, C context) { return new LimitOperator(visitChild(node, context), node.getLimit(), node.getOffset()); } + @Override + public PhysicalPlan visitScanBuilder(TableScanBuilder plan, C context) { + return plan.build(); + } + @Override public PhysicalPlan visitRelation(LogicalRelation node, C context) { throw new UnsupportedOperationException("Storage engine is responsible for " diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java index 28539562e7..9840e3942d 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java @@ -6,6 +6,8 @@ package org.opensearch.sql.planner.logical; +import org.opensearch.sql.storage.TableScanBuilder; + /** * The visitor of {@link LogicalPlan}. * @@ -22,6 +24,10 @@ public R visitRelation(LogicalRelation plan, C context) { return visitNode(plan, context); } + public R visitScanBuilder(TableScanBuilder plan, C context) { + return visitNode(plan, context); + } + public R visitFilter(LogicalFilter plan, C context) { return visitNode(plan, context); } diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java index 0e547df68d..d21abe182f 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java @@ -15,6 +15,8 @@ import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.optimizer.rule.MergeFilterAndFilter; import org.opensearch.sql.planner.optimizer.rule.PushFilterUnderSort; +import org.opensearch.sql.planner.optimizer.rule.scan.CreateTableScanBuilder; +import org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown; /** * {@link LogicalPlan} Optimizer. @@ -39,8 +41,20 @@ public LogicalPlanOptimizer(List> rules) { */ public static LogicalPlanOptimizer create() { return new LogicalPlanOptimizer(Arrays.asList( + /* + * Phase 1: Transformations rely on static relation algebra equivalence + */ new MergeFilterAndFilter(), - new PushFilterUnderSort())); + new PushFilterUnderSort(), + /* + * Phase 2: Transformations rely on connector push down capability + */ + new CreateTableScanBuilder(), + TableScanPushDown.PUSH_DOWN_FILTER, + TableScanPushDown.PUSH_DOWN_AGGREGATION, + TableScanPushDown.PUSH_DOWN_SORT, + TableScanPushDown.PUSH_DOWN_LIMIT, + TableScanPushDown.PUSH_DOWN_PROJECT)); } /** @@ -63,7 +77,12 @@ private LogicalPlan internalOptimize(LogicalPlan plan) { Match match = DEFAULT_MATCHER.match(rule.pattern(), node); if (match.isPresent()) { node = rule.apply(match.value(), match.captures()); - done = false; + + // Re-iterate all rules against the node if the node is replaced by any rule + // TODO: may need to introduce fixed point or maximum iteration limit in future + if (node != match.value()) { + done = false; + } } } } diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java index 73d0f8c577..b9768351c4 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java @@ -6,10 +6,21 @@ package org.opensearch.sql.planner.optimizer.pattern; +import com.facebook.presto.matching.Capture; +import com.facebook.presto.matching.Pattern; import com.facebook.presto.matching.Property; +import com.facebook.presto.matching.PropertyPattern; import java.util.Optional; import lombok.experimental.UtilityClass; +import org.opensearch.sql.planner.logical.LogicalAggregation; +import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalProject; +import org.opensearch.sql.planner.logical.LogicalRelation; +import org.opensearch.sql.planner.logical.LogicalSort; +import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.TableScanBuilder; /** * Pattern helper class. @@ -17,6 +28,48 @@ @UtilityClass public class Patterns { + /** + * Logical filter with a given pattern on inner field. + */ + public static Pattern filter(Pattern pattern) { + return Pattern.typeOf(LogicalFilter.class).with(source(pattern)); + } + + /** + * Logical aggregate operator with a given pattern on inner field. + */ + public static Pattern aggregate(Pattern pattern) { + return Pattern.typeOf(LogicalAggregation.class).with(source(pattern)); + } + + /** + * Logical sort operator with a given pattern on inner field. + */ + public static Pattern sort(Pattern pattern) { + return Pattern.typeOf(LogicalSort.class).with(source(pattern)); + } + + /** + * Logical limit operator with a given pattern on inner field. + */ + public static Pattern limit(Pattern pattern) { + return Pattern.typeOf(LogicalLimit.class).with(source(pattern)); + } + + /** + * Logical project operator with a given pattern on inner field. + */ + public static Pattern project(Pattern pattern) { + return Pattern.typeOf(LogicalProject.class).with(source(pattern)); + } + + /** + * Pattern for {@link TableScanBuilder} and capture it meanwhile. + */ + public static Pattern scanBuilder() { + return Pattern.typeOf(TableScanBuilder.class).capturedAs(Capture.newCapture()); + } + /** * LogicalPlan source {@link Property}. */ @@ -25,4 +78,28 @@ public static Property source() { ? Optional.of(plan.getChild().get(0)) : Optional.empty()); } + + /** + * Source (children field) with a given pattern. + */ + @SuppressWarnings("unchecked") + public static + PropertyPattern source(Pattern pattern) { + Property property = Property.optionalProperty("source", + plan -> plan.getChild().size() == 1 + ? Optional.of((T) plan.getChild().get(0)) + : Optional.empty()); + + return property.matching(pattern); + } + + /** + * Logical relation with table field. + */ + public static Property table() { + return Property.optionalProperty("table", + plan -> plan instanceof LogicalRelation + ? Optional.of(((LogicalRelation) plan).getTable()) + : Optional.empty()); + } } diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java new file mode 100644 index 0000000000..845de5b890 --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java @@ -0,0 +1,47 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.planner.optimizer.rule.scan; + +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.table; + +import com.facebook.presto.matching.Capture; +import com.facebook.presto.matching.Captures; +import com.facebook.presto.matching.Pattern; +import lombok.Getter; +import lombok.experimental.Accessors; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalRelation; +import org.opensearch.sql.planner.optimizer.Rule; +import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.TableScanBuilder; + +/** + * {@code RelationPushDown} defines a set of push down rules... + */ +public class CreateTableScanBuilder implements Rule { + + private final Capture capture; + + @Accessors(fluent = true) + @Getter + private final Pattern pattern; + + /** + * Construct create table scan builder rule. + */ + public CreateTableScanBuilder() { + this.capture = Capture.newCapture(); + this.pattern = Pattern.typeOf(LogicalRelation.class) + .with(table().capturedAs(capture)); + } + + @Override + public LogicalPlan apply(LogicalRelation plan, Captures captures) { + TableScanBuilder scanBuilder = captures.get(capture).createScanBuilder(); + // TODO: temporary check to avoid impact and separate Prometheus refactor work + return (scanBuilder == null) ? plan : scanBuilder; + } +} diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java new file mode 100644 index 0000000000..e493fa5af6 --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java @@ -0,0 +1,119 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.planner.optimizer.rule.scan; + +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.aggregate; +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.filter; +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.limit; +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.project; +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.scanBuilder; +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.sort; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.TableScanPushDownBuilder.match; + +import com.facebook.presto.matching.Capture; +import com.facebook.presto.matching.Captures; +import com.facebook.presto.matching.Pattern; +import com.facebook.presto.matching.pattern.CapturePattern; +import com.facebook.presto.matching.pattern.WithPattern; +import java.util.function.BiFunction; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.optimizer.Rule; +import org.opensearch.sql.storage.TableScanBuilder; + +/** + * Base class for all table scan push down rules. + * + * @param logical plan node type + */ +public class TableScanPushDown implements Rule { + + /** Push down optimize rule for filtering condition. */ + public static final Rule PUSH_DOWN_FILTER = + match( + filter( + scanBuilder())) + .apply((filter, scanBuilder) -> scanBuilder.pushDownFilter(filter)); + + /** Push down optimize rule for aggregate operator. */ + public static final Rule PUSH_DOWN_AGGREGATION = + match( + aggregate( + scanBuilder())) + .apply((agg, scanBuilder) -> scanBuilder.pushDownAggregation(agg)); + + /** Push down optimize rule for sort operator. */ + public static final Rule PUSH_DOWN_SORT = + match( + sort( + scanBuilder())) + .apply((sort, scanBuilder) -> scanBuilder.pushDownSort(sort)); + + /** Push down optimize rule for limit operator. */ + public static final Rule PUSH_DOWN_LIMIT = + match( + limit( + scanBuilder())) + .apply((limit, scanBuilder) -> scanBuilder.pushDownLimit(limit)); + + public static final Rule PUSH_DOWN_PROJECT = + match( + project( + scanBuilder())) + .apply((project, scanBuilder) -> scanBuilder.pushDownProject(project)); + + + /** Pattern that matches a plan node. */ + private final WithPattern pattern; + + /** Capture table scan builder inside a plan node. */ + private final Capture capture; + + /** Push down function applied to the plan node and captured table scan builder. */ + private final BiFunction pushDownFunction; + + + @SuppressWarnings("unchecked") + private TableScanPushDown(WithPattern pattern, + BiFunction pushDownFunction) { + this.pattern = pattern; + this.capture = ((CapturePattern) pattern.getPattern()).capture(); + this.pushDownFunction = pushDownFunction; + } + + @Override + public Pattern pattern() { + return pattern; + } + + @Override + public LogicalPlan apply(T plan, Captures captures) { + TableScanBuilder scanBuilder = captures.get(capture); + if (pushDownFunction.apply(plan, scanBuilder)) { + return scanBuilder; + } + return plan; + } + + /** + * Custom builder class other than generated by Lombok to provide more readable code. + */ + static class TableScanPushDownBuilder { + + private WithPattern pattern; + + public static + TableScanPushDownBuilder match(Pattern pattern) { + TableScanPushDownBuilder builder = new TableScanPushDownBuilder<>(); + builder.pattern = (WithPattern) pattern; + return builder; + } + + public TableScanPushDown apply( + BiFunction pushDownFunction) { + return new TableScanPushDown<>(pattern, pushDownFunction); + } + } +} diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index 34e6ece30b..9c2812f8ba 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -44,7 +44,9 @@ default void create(Map schema) { * * @param plan logical plan * @return physical plan + * @deprecated replaced by write/scan builder */ + @Deprecated(since = "2.5") PhysicalPlan implement(LogicalPlan plan); /** @@ -53,9 +55,19 @@ default void create(Map schema) { * * @param plan logical plan. * @return logical plan. + * @deprecated replaced by write/scan builder */ + @Deprecated(since = "2.5") default LogicalPlan optimize(LogicalPlan plan) { return plan; } + /** + * Create table scan builder for logical to physical transformation. + * @return table scan builder + */ + default TableScanBuilder createScanBuilder() { + return null; // TODO: enforce all connector to create one for unified optimizing workflow + } + } diff --git a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java new file mode 100644 index 0000000000..24e812a1de --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java @@ -0,0 +1,64 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.storage; + +import java.util.Collections; +import org.opensearch.sql.planner.logical.LogicalAggregation; +import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalLimit; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; +import org.opensearch.sql.planner.logical.LogicalProject; +import org.opensearch.sql.planner.logical.LogicalSort; + +/** + * A {@code TableScanBuilder} represents transition state between logical planning + * and physical planning. + */ +public abstract class TableScanBuilder extends LogicalPlan { + + public TableScanBuilder() { + super(Collections.emptyList()); + } + + /** + * Build table scan operator. + * @return table scan operator + */ + public abstract TableScanOperator build(); + + /** + * Can a given filter be pushed down to table scan builder. Assume no such support + * by default unless subclass override this. + * + * @param filter filter node + * @return true if pushed down, otherwise false + */ + public boolean pushDownFilter(LogicalFilter filter) { + return false; + } + + public boolean pushDownAggregation(LogicalAggregation aggregation) { + return false; + } + + public boolean pushDownSort(LogicalSort sort) { + return false; + } + + public boolean pushDownLimit(LogicalLimit limit) { + return false; + } + + public boolean pushDownProject(LogicalProject project) { + return false; + } + + @Override + public R accept(LogicalPlanNodeVisitor visitor, C context) { + return visitor.visitScanBuilder(this, context); + } +} diff --git a/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java b/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java index 3a6a95764c..bcd39d28c3 100644 --- a/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java @@ -36,6 +36,7 @@ import org.junit.jupiter.api.Test; import org.junit.jupiter.api.extension.ExtendWith; import org.mockito.Mock; +import org.mockito.Mockito; import org.mockito.junit.jupiter.MockitoExtension; import org.opensearch.sql.ast.tree.RareTopN.CommandType; import org.opensearch.sql.ast.tree.Sort; @@ -55,6 +56,8 @@ import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.planner.physical.PhysicalPlanDSL; import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.TableScanOperator; @ExtendWith(MockitoExtension.class) class DefaultImplementorTest { @@ -197,4 +200,16 @@ public void visitWindowOperatorShouldReturnPhysicalWindowOperator() { assertEquals(physicalPlan, logicalPlan.accept(implementor, null)); } + + @Test + public void visitTableScanBuilderShouldBuildTableScanOperator() { + TableScanOperator tableScanOperator = Mockito.mock(TableScanOperator.class); + TableScanBuilder tableScanBuilder = new TableScanBuilder() { + @Override + public TableScanOperator build() { + return tableScanOperator; + } + }; + assertEquals(tableScanOperator, tableScanBuilder.accept(implementor, null)); + } } diff --git a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java index 03eeb9c626..654586c844 100644 --- a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java @@ -32,6 +32,8 @@ import org.opensearch.sql.expression.aggregation.Aggregator; import org.opensearch.sql.expression.window.WindowDefinition; import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.TableScanOperator; /** * Todo. Temporary added for UT coverage, Will be removed. @@ -72,6 +74,15 @@ public void testAbstractPlanNodeVisitorShouldReturnNull() { assertNull(relation.accept(new LogicalPlanNodeVisitor() { }, null)); + LogicalPlan tableScanBuilder = new TableScanBuilder() { + @Override + public TableScanOperator build() { + return null; + } + }; + assertNull(tableScanBuilder.accept(new LogicalPlanNodeVisitor() { + }, null)); + LogicalPlan filter = LogicalPlanDSL.filter(relation, expression); assertNull(filter.accept(new LogicalPlanNodeVisitor() { }, null)); diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java index 9f3035888f..4aba9efd10 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java @@ -7,29 +7,51 @@ package org.opensearch.sql.planner.optimizer; import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.mockito.ArgumentMatchers.any; +import static org.mockito.Mockito.when; import static org.opensearch.sql.data.model.ExprValueUtils.integerValue; import static org.opensearch.sql.data.model.ExprValueUtils.longValue; import static org.opensearch.sql.data.type.ExprCoreType.INTEGER; import static org.opensearch.sql.data.type.ExprCoreType.LONG; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.aggregation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.filter; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.limit; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; +import com.google.common.collect.ImmutableList; +import java.util.Map; import org.apache.commons.lang3.tuple.Pair; +import org.junit.jupiter.api.BeforeEach; import org.junit.jupiter.api.Test; import org.junit.jupiter.api.extension.ExtendWith; -import org.opensearch.sql.analysis.AnalyzerTestBase; +import org.mockito.Mock; +import org.mockito.Mockito; +import org.mockito.Spy; +import org.mockito.junit.jupiter.MockitoExtension; import org.opensearch.sql.ast.tree.Sort; +import org.opensearch.sql.data.type.ExprType; import org.opensearch.sql.expression.DSL; import org.opensearch.sql.planner.logical.LogicalPlan; -import org.springframework.context.annotation.Configuration; -import org.springframework.test.context.ContextConfiguration; -import org.springframework.test.context.junit.jupiter.SpringExtension; - -@Configuration -@ExtendWith(SpringExtension.class) -@ContextConfiguration(classes = {AnalyzerTestBase.class}) -class LogicalPlanOptimizerTest extends AnalyzerTestBase { +import org.opensearch.sql.planner.physical.PhysicalPlan; +import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.TableScanBuilder; + +@ExtendWith(MockitoExtension.class) +class LogicalPlanOptimizerTest { + + @Mock + private Table table; + + @Spy + private TableScanBuilder tableScanBuilder; + + @BeforeEach + void setUp() { + when(table.createScanBuilder()).thenReturn(tableScanBuilder); + } + /** * Filter - Filter --> Filter. */ @@ -37,7 +59,7 @@ class LogicalPlanOptimizerTest extends AnalyzerTestBase { void filter_merge_filter() { assertEquals( filter( - relation("schema", table), + tableScanBuilder, DSL.and(DSL.equal(DSL.ref("integer_value", INTEGER), DSL.literal(integerValue(2))), DSL.equal(DSL.ref("integer_value", INTEGER), DSL.literal(integerValue(1)))) ), @@ -61,7 +83,7 @@ void push_filter_under_sort() { assertEquals( sort( filter( - relation("schema", table), + tableScanBuilder, DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) ), Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) @@ -86,7 +108,7 @@ void multiple_filter_should_eventually_be_merged() { assertEquals( sort( filter( - relation("schema", table), + tableScanBuilder, DSL.and(DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))), DSL.less(DSL.ref("longV", INTEGER), DSL.literal(longValue(1L)))) ), @@ -107,6 +129,130 @@ void multiple_filter_should_eventually_be_merged() { ); } + @Test + void default_table_scan_builder_should_not_push_down_anything() { + LogicalPlan[] plans = { + project( + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER)) + ), + filter( + relation("schema", table), + DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) + ), + aggregation( + relation("schema", table), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", DSL.ref("longV", LONG)))), + sort( + relation("schema", table), + Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER))), + limit( + relation("schema", table), + 1, 1) + }; + + for (LogicalPlan plan : plans) { + assertEquals(plan, optimize(plan)); + } + } + + @Test + void table_scan_builder_support_project_push_down_can_apply_its_rule() { + when(tableScanBuilder.pushDownProject(any())).thenReturn(true); + + assertEquals( + tableScanBuilder, + optimize( + project( + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER))) + ) + ); + } + + @Test + void table_scan_builder_support_filter_push_down_can_apply_its_rule() { + when(tableScanBuilder.pushDownFilter(any())).thenReturn(true); + + assertEquals( + tableScanBuilder, + optimize( + filter( + relation("schema", table), + DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1)))) + ) + ); + } + + @Test + void table_scan_builder_support_aggregation_push_down_can_apply_its_rule() { + when(tableScanBuilder.pushDownAggregation(any())).thenReturn(true); + + assertEquals( + tableScanBuilder, + optimize( + aggregation( + relation("schema", table), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", DSL.ref("longV", LONG)))) + ) + ); + } + + @Test + void table_scan_builder_support_sort_push_down_can_apply_its_rule() { + when(tableScanBuilder.pushDownSort(any())).thenReturn(true); + + assertEquals( + tableScanBuilder, + optimize( + sort( + relation("schema", table), + Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER))) + ) + ); + } + + @Test + void table_scan_builder_support_limit_push_down_can_apply_its_rule() { + when(tableScanBuilder.pushDownLimit(any())).thenReturn(true); + + assertEquals( + tableScanBuilder, + optimize( + limit( + relation("schema", table), + 1, 1) + ) + ); + } + + @Test + void table_not_support_scan_builder_should_not_be_impact() { + Mockito.reset(table, tableScanBuilder); + Table table = new Table() { + @Override + public Map getFieldTypes() { + return null; + } + + @Override + public PhysicalPlan implement(LogicalPlan plan) { + return null; + } + }; + + assertEquals( + relation("schema", table), + optimize(relation("schema", table)) + ); + } + private LogicalPlan optimize(LogicalPlan plan) { final LogicalPlanOptimizer optimizer = LogicalPlanOptimizer.create(); final LogicalPlan optimize = optimizer.optimize(plan); diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java index ad7c7c50dc..61d192362a 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java @@ -13,7 +13,9 @@ import org.junit.jupiter.api.Test; import org.junit.jupiter.api.extension.ExtendWith; import org.mockito.Mock; +import org.mockito.Mockito; import org.mockito.junit.jupiter.MockitoExtension; +import org.opensearch.sql.planner.logical.LogicalFilter; import org.opensearch.sql.planner.logical.LogicalPlan; @ExtendWith(MockitoExtension.class) @@ -26,5 +28,12 @@ class PatternsTest { void source_is_empty() { when(plan.getChild()).thenReturn(Collections.emptyList()); assertFalse(Patterns.source().getFunction().apply(plan).isPresent()); + assertFalse(Patterns.source(null).getProperty().getFunction().apply(plan).isPresent()); + } + + @Test + void table_is_empty() { + plan = Mockito.mock(LogicalFilter.class); + assertFalse(Patterns.table().getFunction().apply(plan).isPresent()); } } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexAgg.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexAgg.java deleted file mode 100644 index 84bfb47a08..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexAgg.java +++ /dev/null @@ -1,80 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical; - -import com.google.common.collect.ImmutableList; -import java.util.List; -import lombok.Builder; -import lombok.EqualsAndHashCode; -import lombok.Getter; -import lombok.Setter; -import lombok.ToString; -import org.apache.commons.lang3.tuple.Pair; -import org.opensearch.sql.ast.tree.Sort; -import org.opensearch.sql.expression.Expression; -import org.opensearch.sql.expression.NamedExpression; -import org.opensearch.sql.expression.aggregation.NamedAggregator; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; - -/** - * Logical Index Scan Aggregation Operation. - */ -@Getter -@ToString -@EqualsAndHashCode(callSuper = false) -public class OpenSearchLogicalIndexAgg extends LogicalPlan { - - private final String relationName; - - /** - * Filter Condition. - */ - @Setter - private Expression filter; - - /** - * Aggregation List. - */ - @Setter - private List aggregatorList; - - /** - * Group List. - */ - @Setter - private List groupByList; - - /** - * Sort List. - */ - @Setter - private List> sortList; - - /** - * ElasticsearchLogicalIndexAgg Constructor. - */ - @Builder - public OpenSearchLogicalIndexAgg( - String relationName, - Expression filter, - List aggregatorList, - List groupByList, - List> sortList) { - super(ImmutableList.of()); - this.relationName = relationName; - this.filter = filter; - this.aggregatorList = aggregatorList; - this.groupByList = groupByList; - this.sortList = sortList; - } - - @Override - public R accept(LogicalPlanNodeVisitor visitor, C context) { - return visitor.visitNode(this, context); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScan.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScan.java deleted file mode 100644 index d182b5f84d..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScan.java +++ /dev/null @@ -1,97 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical; - -import com.google.common.collect.ImmutableList; -import java.util.List; -import java.util.Set; -import lombok.Builder; -import lombok.EqualsAndHashCode; -import lombok.Getter; -import lombok.Setter; -import lombok.ToString; -import org.apache.commons.lang3.tuple.Pair; -import org.opensearch.sql.ast.tree.Sort; -import org.opensearch.sql.expression.Expression; -import org.opensearch.sql.expression.ReferenceExpression; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; - -/** - * OpenSearch Logical Index Scan Operation. - */ -@Getter -@ToString -@EqualsAndHashCode(callSuper = false) -public class OpenSearchLogicalIndexScan extends LogicalPlan { - - /** - * Relation Name. - */ - private final String relationName; - - /** - * Filter Condition. - */ - @Setter - private Expression filter; - - /** - * Projection List. - */ - @Setter - private Set projectList; - - /** - * Sort List. - */ - @Setter - private List> sortList; - - @Setter - private Integer offset; - - @Setter - private Integer limit; - - /** - * ElasticsearchLogicalIndexScan Constructor. - */ - @Builder - public OpenSearchLogicalIndexScan( - String relationName, - Expression filter, - Set projectList, - List> sortList, - Integer limit, Integer offset) { - super(ImmutableList.of()); - this.relationName = relationName; - this.filter = filter; - this.projectList = projectList; - this.sortList = sortList; - this.limit = limit; - this.offset = offset; - } - - @Override - public R accept(LogicalPlanNodeVisitor visitor, C context) { - return visitor.visitNode(this, context); - } - - public boolean hasLimit() { - return limit != null; - } - - /** - * Test has projects or not. - * - * @return true for has projects, otherwise false. - */ - public boolean hasProjects() { - return projectList != null && !projectList.isEmpty(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalPlanOptimizerFactory.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalPlanOptimizerFactory.java deleted file mode 100644 index 77cb6b13bd..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalPlanOptimizerFactory.java +++ /dev/null @@ -1,47 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical; - -import java.util.Arrays; -import lombok.experimental.UtilityClass; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeAggAndIndexScan; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeAggAndRelation; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeFilterAndRelation; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeLimitAndIndexScan; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeLimitAndRelation; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeSortAndIndexAgg; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeSortAndIndexScan; -import org.opensearch.sql.opensearch.planner.logical.rule.MergeSortAndRelation; -import org.opensearch.sql.opensearch.planner.logical.rule.PushProjectAndIndexScan; -import org.opensearch.sql.opensearch.planner.logical.rule.PushProjectAndRelation; -import org.opensearch.sql.planner.optimizer.LogicalPlanOptimizer; - -/** - * OpenSearch storage specified logical plan optimizer. - */ -@UtilityClass -public class OpenSearchLogicalPlanOptimizerFactory { - - /** - * Create OpenSearch storage specified logical plan optimizer. - */ - public static LogicalPlanOptimizer create() { - return new LogicalPlanOptimizer(Arrays.asList( - new MergeFilterAndRelation(), - new MergeAggAndIndexScan(), - new MergeAggAndRelation(), - new MergeSortAndRelation(), - new MergeSortAndIndexScan(), - new MergeSortAndIndexAgg(), - new MergeSortAndIndexScan(), - new MergeLimitAndRelation(), - new MergeLimitAndIndexScan(), - new PushProjectAndRelation(), - new PushProjectAndIndexScan() - )); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndIndexScan.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndIndexScan.java deleted file mode 100644 index 3d4d999d12..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndIndexScan.java +++ /dev/null @@ -1,57 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import lombok.Getter; -import lombok.experimental.Accessors; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexAgg; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalAggregation; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Merge Aggregation -- Relation to IndexScanAggregation. - */ -public class MergeAggAndIndexScan implements Rule { - - private final Capture capture; - - @Accessors(fluent = true) - @Getter - private final Pattern pattern; - - /** - * Constructor of MergeAggAndIndexScan. - */ - public MergeAggAndIndexScan() { - this.capture = Capture.newCapture(); - this.pattern = typeOf(LogicalAggregation.class) - .with(source().matching(typeOf(OpenSearchLogicalIndexScan.class) - .matching(indexScan -> !indexScan.hasLimit()) - .capturedAs(capture))); - } - - @Override - public LogicalPlan apply(LogicalAggregation aggregation, - Captures captures) { - OpenSearchLogicalIndexScan indexScan = captures.get(capture); - return OpenSearchLogicalIndexAgg - .builder() - .relationName(indexScan.getRelationName()) - .filter(indexScan.getFilter()) - .aggregatorList(aggregation.getAggregatorList()) - .groupByList(aggregation.getGroupByList()) - .build(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndRelation.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndRelation.java deleted file mode 100644 index 2e79e7c51a..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeAggAndRelation.java +++ /dev/null @@ -1,54 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import lombok.Getter; -import lombok.experimental.Accessors; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexAgg; -import org.opensearch.sql.planner.logical.LogicalAggregation; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalRelation; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Merge Aggregation -- Relation to IndexScanAggregation. - */ -public class MergeAggAndRelation implements Rule { - - private final Capture relationCapture; - - @Accessors(fluent = true) - @Getter - private final Pattern pattern; - - /** - * Constructor of MergeAggAndRelation. - */ - public MergeAggAndRelation() { - this.relationCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalAggregation.class) - .with(source().matching(typeOf(LogicalRelation.class).capturedAs(relationCapture))); - } - - @Override - public LogicalPlan apply(LogicalAggregation aggregation, - Captures captures) { - LogicalRelation relation = captures.get(relationCapture); - return OpenSearchLogicalIndexAgg - .builder() - .relationName(relation.getRelationName()) - .aggregatorList(aggregation.getAggregatorList()) - .groupByList(aggregation.getGroupByList()) - .build(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeFilterAndRelation.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeFilterAndRelation.java deleted file mode 100644 index 19143c390e..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeFilterAndRelation.java +++ /dev/null @@ -1,53 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalFilter; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalRelation; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Merge Filter -- Relation to LogicalIndexScan. - */ -public class MergeFilterAndRelation implements Rule { - - private final Capture relationCapture; - private final Pattern pattern; - - /** - * Constructor of MergeFilterAndRelation. - */ - public MergeFilterAndRelation() { - this.relationCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalFilter.class) - .with(source().matching(typeOf(LogicalRelation.class).capturedAs(relationCapture))); - } - - @Override - public Pattern pattern() { - return pattern; - } - - @Override - public LogicalPlan apply(LogicalFilter filter, - Captures captures) { - LogicalRelation relation = captures.get(relationCapture); - return OpenSearchLogicalIndexScan - .builder() - .relationName(relation.getRelationName()) - .filter(filter.getCondition()) - .build(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndIndexScan.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndIndexScan.java deleted file mode 100644 index 9d880bb4dc..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndIndexScan.java +++ /dev/null @@ -1,54 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import lombok.Getter; -import lombok.experimental.Accessors; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalLimit; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.optimizer.Rule; - -@Getter -public class MergeLimitAndIndexScan implements Rule { - - private final Capture indexScanCapture; - - @Accessors(fluent = true) - private final Pattern pattern; - - /** - * Constructor of MergeLimitAndIndexScan. - */ - public MergeLimitAndIndexScan() { - this.indexScanCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalLimit.class) - .with(source() - .matching(typeOf(OpenSearchLogicalIndexScan.class).capturedAs(indexScanCapture))); - } - - @Override - public LogicalPlan apply(LogicalLimit plan, Captures captures) { - OpenSearchLogicalIndexScan indexScan = captures.get(indexScanCapture); - OpenSearchLogicalIndexScan.OpenSearchLogicalIndexScanBuilder builder = - OpenSearchLogicalIndexScan.builder(); - builder.relationName(indexScan.getRelationName()) - .filter(indexScan.getFilter()) - .offset(plan.getOffset()) - .limit(plan.getLimit()); - if (indexScan.getSortList() != null) { - builder.sortList(indexScan.getSortList()); - } - return builder.build(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndRelation.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndRelation.java deleted file mode 100644 index 8a170aaa4a..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeLimitAndRelation.java +++ /dev/null @@ -1,49 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import lombok.Getter; -import lombok.experimental.Accessors; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalLimit; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalRelation; -import org.opensearch.sql.planner.optimizer.Rule; - -@Getter -public class MergeLimitAndRelation implements Rule { - - private final Capture relationCapture; - - @Accessors(fluent = true) - private final Pattern pattern; - - /** - * Constructor of MergeLimitAndRelation. - */ - public MergeLimitAndRelation() { - this.relationCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalLimit.class) - .with(source().matching(typeOf(LogicalRelation.class).capturedAs(relationCapture))); - } - - @Override - public LogicalPlan apply(LogicalLimit plan, Captures captures) { - LogicalRelation relation = captures.get(relationCapture); - return OpenSearchLogicalIndexScan.builder() - .relationName(relation.getRelationName()) - .offset(plan.getOffset()) - .limit(plan.getLimit()) - .build(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexAgg.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexAgg.java deleted file mode 100644 index 57dac4dcf1..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexAgg.java +++ /dev/null @@ -1,82 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import java.util.Set; -import java.util.concurrent.atomic.AtomicReference; -import java.util.stream.Collectors; -import lombok.Getter; -import lombok.experimental.Accessors; -import org.apache.commons.lang3.tuple.Pair; -import org.opensearch.sql.ast.tree.Sort; -import org.opensearch.sql.expression.Expression; -import org.opensearch.sql.expression.ReferenceExpression; -import org.opensearch.sql.expression.aggregation.NamedAggregator; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexAgg; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalSort; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Merge Sort -- IndexScanAggregation to IndexScanAggregation. - */ -public class MergeSortAndIndexAgg implements Rule { - - private final Capture indexAggCapture; - - @Accessors(fluent = true) - @Getter - private final Pattern pattern; - - /** - * Constructor of MergeAggAndIndexScan. - */ - public MergeSortAndIndexAgg() { - this.indexAggCapture = Capture.newCapture(); - final AtomicReference sortRef = new AtomicReference<>(); - - this.pattern = typeOf(LogicalSort.class) - .matching(OptimizationRuleUtils::sortByFieldsOnly) - .matching(sort -> { - sortRef.set(sort); - return true; - }) - .with(source().matching(typeOf(OpenSearchLogicalIndexAgg.class) - .matching(indexAgg -> !hasAggregatorInSortBy(sortRef.get(), indexAgg)) - .capturedAs(indexAggCapture))); - } - - @Override - public LogicalPlan apply(LogicalSort sort, - Captures captures) { - OpenSearchLogicalIndexAgg indexAgg = captures.get(indexAggCapture); - return OpenSearchLogicalIndexAgg.builder() - .relationName(indexAgg.getRelationName()) - .filter(indexAgg.getFilter()) - .groupByList(indexAgg.getGroupByList()) - .aggregatorList(indexAgg.getAggregatorList()) - .sortList(sort.getSortList()) - .build(); - } - - private boolean hasAggregatorInSortBy(LogicalSort sort, OpenSearchLogicalIndexAgg agg) { - final Set aggregatorNames = - agg.getAggregatorList().stream().map(NamedAggregator::getName).collect(Collectors.toSet()); - for (Pair sortPair : sort.getSortList()) { - if (aggregatorNames.contains(((ReferenceExpression) sortPair.getRight()).getAttr())) { - return true; - } - } - return false; - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexScan.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexScan.java deleted file mode 100644 index 337f09308c..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndIndexScan.java +++ /dev/null @@ -1,70 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import java.util.List; -import java.util.stream.Collectors; -import java.util.stream.Stream; -import org.apache.commons.lang3.tuple.Pair; -import org.opensearch.sql.ast.tree.Sort; -import org.opensearch.sql.expression.Expression; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalSort; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Merge Sort with IndexScan only when Sort by fields. - */ -public class MergeSortAndIndexScan implements Rule { - - private final Capture indexScanCapture; - private final Pattern pattern; - - /** - * Constructor of MergeSortAndRelation. - */ - public MergeSortAndIndexScan() { - this.indexScanCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalSort.class).matching(OptimizationRuleUtils::sortByFieldsOnly) - .with(source() - .matching(typeOf(OpenSearchLogicalIndexScan.class).capturedAs(indexScanCapture))); - } - - @Override - public Pattern pattern() { - return pattern; - } - - @Override - public LogicalPlan apply(LogicalSort sort, - Captures captures) { - OpenSearchLogicalIndexScan indexScan = captures.get(indexScanCapture); - - return OpenSearchLogicalIndexScan - .builder() - .relationName(indexScan.getRelationName()) - .filter(indexScan.getFilter()) - .sortList(mergeSortList(indexScan.getSortList(), sort.getSortList())) - .build(); - } - - private List> mergeSortList(List> l1, List> l2) { - if (null == l1) { - return l2; - } else { - return Stream.concat(l1.stream(), l2.stream()).collect(Collectors.toList()); - } - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndRelation.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndRelation.java deleted file mode 100644 index 3ba3c7f645..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/MergeSortAndRelation.java +++ /dev/null @@ -1,53 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalRelation; -import org.opensearch.sql.planner.logical.LogicalSort; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Merge Sort with Relation only when Sort by fields. - */ -public class MergeSortAndRelation implements Rule { - - private final Capture relationCapture; - private final Pattern pattern; - - /** - * Constructor of MergeSortAndRelation. - */ - public MergeSortAndRelation() { - this.relationCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalSort.class).matching(OptimizationRuleUtils::sortByFieldsOnly) - .with(source().matching(typeOf(LogicalRelation.class).capturedAs(relationCapture))); - } - - @Override - public Pattern pattern() { - return pattern; - } - - @Override - public LogicalPlan apply(LogicalSort sort, - Captures captures) { - LogicalRelation relation = captures.get(relationCapture); - return OpenSearchLogicalIndexScan - .builder() - .relationName(relation.getRelationName()) - .sortList(sort.getSortList()) - .build(); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/OptimizationRuleUtils.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/OptimizationRuleUtils.java deleted file mode 100644 index aa1ffa9e4c..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/OptimizationRuleUtils.java +++ /dev/null @@ -1,66 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import java.util.ArrayList; -import java.util.HashSet; -import java.util.List; -import java.util.Set; -import lombok.experimental.UtilityClass; -import org.opensearch.sql.expression.ExpressionNodeVisitor; -import org.opensearch.sql.expression.NamedExpression; -import org.opensearch.sql.expression.ReferenceExpression; -import org.opensearch.sql.planner.logical.LogicalSort; - -@UtilityClass -public class OptimizationRuleUtils { - - /** - * Does the sort list only contain {@link ReferenceExpression}. - * - * @param logicalSort LogicalSort. - * @return true only contain ReferenceExpression, otherwise false. - */ - public static boolean sortByFieldsOnly(LogicalSort logicalSort) { - return logicalSort.getSortList().stream() - .map(sort -> sort.getRight() instanceof ReferenceExpression) - .reduce(true, Boolean::logicalAnd); - } - - /** - * Find reference expression from expression. - * @param expressions a list of expression. - * - * @return a list of ReferenceExpression - */ - public static Set findReferenceExpressions( - List expressions) { - Set projectList = new HashSet<>(); - for (NamedExpression namedExpression : expressions) { - projectList.addAll(findReferenceExpression(namedExpression)); - } - return projectList; - } - - /** - * Find reference expression from expression. - * @param expression expression. - * - * @return a list of ReferenceExpression - */ - public static List findReferenceExpression( - NamedExpression expression) { - List results = new ArrayList<>(); - expression.accept(new ExpressionNodeVisitor() { - @Override - public Object visitReference(ReferenceExpression node, Object context) { - return results.add(node); - } - }, null); - return results; - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndIndexScan.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndIndexScan.java deleted file mode 100644 index 43714282fb..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndIndexScan.java +++ /dev/null @@ -1,63 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.opensearch.planner.logical.rule.OptimizationRuleUtils.findReferenceExpressions; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import java.util.Set; -import org.opensearch.sql.expression.ReferenceExpression; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalProject; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Push Project list into ElasticsearchLogicalIndexScan. - */ -public class PushProjectAndIndexScan implements Rule { - - private final Capture indexScanCapture; - - private final Pattern pattern; - - private Set pushDownProjects; - - /** - * Constructor of MergeProjectAndIndexScan. - */ - public PushProjectAndIndexScan() { - this.indexScanCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalProject.class).matching( - project -> { - pushDownProjects = findReferenceExpressions(project.getProjectList()); - return !pushDownProjects.isEmpty(); - }).with(source() - .matching(typeOf(OpenSearchLogicalIndexScan.class) - .matching(indexScan -> !indexScan.hasProjects()) - .capturedAs(indexScanCapture))); - - } - - @Override - public Pattern pattern() { - return pattern; - } - - @Override - public LogicalPlan apply(LogicalProject project, - Captures captures) { - OpenSearchLogicalIndexScan indexScan = captures.get(indexScanCapture); - indexScan.setProjectList(pushDownProjects); - return new LogicalProject(indexScan, project.getProjectList(), - project.getNamedParseExpressions()); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndRelation.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndRelation.java deleted file mode 100644 index a29a1df466..0000000000 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/planner/logical/rule/PushProjectAndRelation.java +++ /dev/null @@ -1,67 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical.rule; - -import static com.facebook.presto.matching.Pattern.typeOf; -import static org.opensearch.sql.opensearch.planner.logical.rule.OptimizationRuleUtils.findReferenceExpressions; -import static org.opensearch.sql.planner.optimizer.pattern.Patterns.source; - -import com.facebook.presto.matching.Capture; -import com.facebook.presto.matching.Captures; -import com.facebook.presto.matching.Pattern; -import java.util.Set; -import org.opensearch.sql.expression.ReferenceExpression; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalProject; -import org.opensearch.sql.planner.logical.LogicalRelation; -import org.opensearch.sql.planner.optimizer.Rule; - -/** - * Push Project list into Relation. The transformed plan is Project - IndexScan - */ -public class PushProjectAndRelation implements Rule { - - private final Capture relationCapture; - - private final Pattern pattern; - - private Set pushDownProjects; - - /** - * Constructor of MergeProjectAndRelation. - */ - public PushProjectAndRelation() { - this.relationCapture = Capture.newCapture(); - this.pattern = typeOf(LogicalProject.class) - .matching(project -> { - pushDownProjects = findReferenceExpressions(project.getProjectList()); - return !pushDownProjects.isEmpty(); - }) - .with(source().matching(typeOf(LogicalRelation.class).capturedAs(relationCapture))); - } - - @Override - public Pattern pattern() { - return pattern; - } - - @Override - public LogicalPlan apply(LogicalProject project, - Captures captures) { - LogicalRelation relation = captures.get(relationCapture); - return new LogicalProject( - OpenSearchLogicalIndexScan - .builder() - .relationName(relation.getRelationName()) - .projectList(findReferenceExpressions(project.getProjectList())) - .build(), - project.getProjectList(), - project.getNamedParseExpressions() - ); - } -} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/CompositeAggregationParser.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/CompositeAggregationParser.java index 00e8a5154c..7459300caa 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/CompositeAggregationParser.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/CompositeAggregationParser.java @@ -18,12 +18,14 @@ import java.util.List; import java.util.Map; import java.util.stream.Collectors; +import lombok.EqualsAndHashCode; import org.opensearch.search.aggregations.Aggregations; import org.opensearch.search.aggregations.bucket.composite.CompositeAggregation; /** * Composite Aggregation Parser which include composite aggregation and metric parsers. */ +@EqualsAndHashCode public class CompositeAggregationParser implements OpenSearchAggregationResponseParser { private final MetricParserHelper metricsParser; diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/FilterParser.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/FilterParser.java index cfcba82c18..8358379be0 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/FilterParser.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/FilterParser.java @@ -15,6 +15,7 @@ import java.util.Map; import lombok.Builder; +import lombok.EqualsAndHashCode; import lombok.Getter; import org.opensearch.search.aggregations.Aggregation; import org.opensearch.search.aggregations.bucket.filter.Filter; @@ -25,6 +26,7 @@ * do nothing and return the result from metricsParser. */ @Builder +@EqualsAndHashCode public class FilterParser implements MetricParser { private final MetricParser metricsParser; diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/MetricParserHelper.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/MetricParserHelper.java index 54b9305f49..d5c0141ad2 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/MetricParserHelper.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/MetricParserHelper.java @@ -17,6 +17,7 @@ import java.util.List; import java.util.Map; import java.util.stream.Collectors; +import lombok.EqualsAndHashCode; import lombok.RequiredArgsConstructor; import org.opensearch.search.aggregations.Aggregation; import org.opensearch.search.aggregations.Aggregations; @@ -25,6 +26,7 @@ /** * Parse multiple metrics in one bucket. */ +@EqualsAndHashCode @RequiredArgsConstructor public class MetricParserHelper { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/SingleValueParser.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/SingleValueParser.java index 88d9604137..384e07ad8f 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/SingleValueParser.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/SingleValueParser.java @@ -17,6 +17,7 @@ import java.util.Collections; import java.util.Map; +import lombok.EqualsAndHashCode; import lombok.Getter; import lombok.RequiredArgsConstructor; import org.opensearch.search.aggregations.Aggregation; @@ -25,6 +26,7 @@ /** * {@link NumericMetricsAggregation.SingleValue} metric parser. */ +@EqualsAndHashCode @RequiredArgsConstructor public class SingleValueParser implements MetricParser { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/StatsParser.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/StatsParser.java index 5928b7efc9..c80b75de05 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/StatsParser.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/StatsParser.java @@ -18,6 +18,7 @@ import java.util.Collections; import java.util.Map; import java.util.function.Function; +import lombok.EqualsAndHashCode; import lombok.Getter; import lombok.RequiredArgsConstructor; import org.opensearch.search.aggregations.Aggregation; @@ -26,6 +27,7 @@ /** * {@link ExtendedStats} metric parser. */ +@EqualsAndHashCode @RequiredArgsConstructor public class StatsParser implements MetricParser { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/TopHitsParser.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/TopHitsParser.java index 4a3a346a84..a98e1b4ce3 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/TopHitsParser.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/response/agg/TopHitsParser.java @@ -10,6 +10,7 @@ import java.util.Collections; import java.util.Map; import java.util.stream.Collectors; +import lombok.EqualsAndHashCode; import lombok.Getter; import lombok.RequiredArgsConstructor; import org.opensearch.search.aggregations.Aggregation; @@ -18,6 +19,7 @@ /** * {@link TopHits} metric parser. */ +@EqualsAndHashCode @RequiredArgsConstructor public class TopHitsParser implements MetricParser { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java index 26082abed1..ada6341def 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java @@ -8,41 +8,29 @@ import com.google.common.annotations.VisibleForTesting; import java.util.HashMap; -import java.util.List; import java.util.Map; -import java.util.stream.Collectors; import lombok.RequiredArgsConstructor; -import org.apache.commons.lang3.tuple.Pair; -import org.opensearch.index.query.QueryBuilder; -import org.opensearch.search.aggregations.AggregationBuilder; import org.opensearch.sql.common.setting.Settings; import org.opensearch.sql.common.utils.StringUtils; import org.opensearch.sql.data.type.ExprType; import org.opensearch.sql.opensearch.client.OpenSearchClient; import org.opensearch.sql.opensearch.data.type.OpenSearchDataType; import org.opensearch.sql.opensearch.data.value.OpenSearchExprValueFactory; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexAgg; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalPlanOptimizerFactory; import org.opensearch.sql.opensearch.planner.physical.ADOperator; import org.opensearch.sql.opensearch.planner.physical.MLCommonsOperator; import org.opensearch.sql.opensearch.planner.physical.MLOperator; import org.opensearch.sql.opensearch.request.OpenSearchRequest; import org.opensearch.sql.opensearch.request.system.OpenSearchDescribeIndexRequest; -import org.opensearch.sql.opensearch.response.agg.OpenSearchAggregationResponseParser; -import org.opensearch.sql.opensearch.storage.script.aggregation.AggregationQueryBuilder; -import org.opensearch.sql.opensearch.storage.script.filter.FilterQueryBuilder; -import org.opensearch.sql.opensearch.storage.script.sort.SortQueryBuilder; -import org.opensearch.sql.opensearch.storage.serialization.DefaultExpressionSerializer; +import org.opensearch.sql.opensearch.storage.scan.OpenSearchIndexScanBuilder; import org.opensearch.sql.planner.DefaultImplementor; import org.opensearch.sql.planner.logical.LogicalAD; import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalML; import org.opensearch.sql.planner.logical.LogicalMLCommons; import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.logical.LogicalRelation; import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.TableScanBuilder; /** OpenSearch table (index) implementation. */ public class OpenSearchIndex implements Table { @@ -122,98 +110,31 @@ public Integer getMaxResultWindow() { */ @Override public PhysicalPlan implement(LogicalPlan plan) { - OpenSearchIndexScan indexScan = new OpenSearchIndexScan(client, settings, indexName, - getMaxResultWindow(), new OpenSearchExprValueFactory(getFieldTypes())); - - /* - * Visit logical plan with index scan as context so logical operators visited, such as - * aggregation, filter, will accumulate (push down) OpenSearch query and aggregation DSL on - * index scan. - */ - return plan.accept(new OpenSearchDefaultImplementor(indexScan, client), indexScan); + // TODO: deprecate this and move to Planner. For now leave it here to + // avoid impact Prometheus optimize/implement logic + return plan.accept(new OpenSearchDefaultImplementor(client), null); } @Override public LogicalPlan optimize(LogicalPlan plan) { - return OpenSearchLogicalPlanOptimizerFactory.create().optimize(plan); + // No-op because optimization already done in Planner + return plan; + } + + @Override + public TableScanBuilder createScanBuilder() { + OpenSearchIndexScan indexScan = new OpenSearchIndexScan(client, settings, indexName, + getMaxResultWindow(), new OpenSearchExprValueFactory(getFieldTypes())); + return new OpenSearchIndexScanBuilder(indexScan); } @VisibleForTesting @RequiredArgsConstructor public static class OpenSearchDefaultImplementor extends DefaultImplementor { - private final OpenSearchIndexScan indexScan; private final OpenSearchClient client; - @Override - public PhysicalPlan visitNode(LogicalPlan plan, OpenSearchIndexScan context) { - if (plan instanceof OpenSearchLogicalIndexScan) { - return visitIndexScan((OpenSearchLogicalIndexScan) plan, context); - } else if (plan instanceof OpenSearchLogicalIndexAgg) { - return visitIndexAggregation((OpenSearchLogicalIndexAgg) plan, context); - } else { - throw new IllegalStateException(StringUtils.format("unexpected plan node type %s", - plan.getClass())); - } - } - - /** - * Implement ElasticsearchLogicalIndexScan. - */ - public PhysicalPlan visitIndexScan(OpenSearchLogicalIndexScan node, - OpenSearchIndexScan context) { - if (null != node.getSortList()) { - final SortQueryBuilder builder = new SortQueryBuilder(); - context.getRequestBuilder().pushDownSort(node.getSortList().stream() - .map(sort -> builder.build(sort.getValue(), sort.getKey())) - .collect(Collectors.toList())); - } - - if (null != node.getFilter()) { - FilterQueryBuilder queryBuilder = new FilterQueryBuilder(new DefaultExpressionSerializer()); - QueryBuilder query = queryBuilder.build(node.getFilter()); - context.getRequestBuilder().pushDown(query); - } - - if (node.getLimit() != null) { - context.getRequestBuilder().pushDownLimit(node.getLimit(), node.getOffset()); - } - - if (node.hasProjects()) { - context.getRequestBuilder().pushDownProjects(node.getProjectList()); - } - return indexScan; - } - - /** - * Implement ElasticsearchLogicalIndexAgg. - */ - public PhysicalPlan visitIndexAggregation(OpenSearchLogicalIndexAgg node, - OpenSearchIndexScan context) { - if (node.getFilter() != null) { - FilterQueryBuilder queryBuilder = new FilterQueryBuilder( - new DefaultExpressionSerializer()); - QueryBuilder query = queryBuilder.build(node.getFilter()); - context.getRequestBuilder().pushDown(query); - } - AggregationQueryBuilder builder = - new AggregationQueryBuilder(new DefaultExpressionSerializer()); - Pair, OpenSearchAggregationResponseParser> aggregationBuilder = - builder.buildAggregationBuilder(node.getAggregatorList(), - node.getGroupByList(), node.getSortList()); - context.getRequestBuilder().pushDownAggregation(aggregationBuilder); - context.getRequestBuilder().pushTypeMapping( - builder.buildTypeMapping(node.getAggregatorList(), - node.getGroupByList())); - return indexScan; - } - - @Override - public PhysicalPlan visitRelation(LogicalRelation node, OpenSearchIndexScan context) { - return indexScan; - } - @Override public PhysicalPlan visitMLCommons(LogicalMLCommons node, OpenSearchIndexScan context) { return new MLCommonsOperator(visitChild(node, context), node.getAlgorithm(), diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java new file mode 100644 index 0000000000..95ece2939a --- /dev/null +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java @@ -0,0 +1,98 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.opensearch.storage.scan; + +import java.util.List; +import java.util.Set; +import java.util.stream.Collectors; +import org.apache.commons.lang3.tuple.Pair; +import org.opensearch.search.aggregations.AggregationBuilder; +import org.opensearch.sql.ast.tree.Sort; +import org.opensearch.sql.expression.Expression; +import org.opensearch.sql.expression.NamedExpression; +import org.opensearch.sql.expression.ReferenceExpression; +import org.opensearch.sql.expression.aggregation.NamedAggregator; +import org.opensearch.sql.opensearch.response.agg.OpenSearchAggregationResponseParser; +import org.opensearch.sql.opensearch.storage.OpenSearchIndexScan; +import org.opensearch.sql.opensearch.storage.script.aggregation.AggregationQueryBuilder; +import org.opensearch.sql.opensearch.storage.serialization.DefaultExpressionSerializer; +import org.opensearch.sql.planner.logical.LogicalAggregation; +import org.opensearch.sql.planner.logical.LogicalSort; +import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.TableScanOperator; + +/** + * Index scan builder for aggregate query used by {@link OpenSearchIndexScanBuilder} internally. + */ +class OpenSearchAggregateIndexScanBuilder extends TableScanBuilder { + + /** OpenSearch index scan to be optimized. */ + private final OpenSearchIndexScan indexScan; + + /** Aggregators pushed down. */ + private List aggregatorList; + + /** Grouping items pushed down. */ + private List groupByList; + + /** Sorting items pushed down. */ + private List> sortList; + + /** + * Initialize with given index scan and perform push-down optimization later. + * + * @param indexScan index scan not fully optimized yet + */ + OpenSearchAggregateIndexScanBuilder(OpenSearchIndexScan indexScan) { + this.indexScan = indexScan; + } + + @Override + public TableScanOperator build() { + AggregationQueryBuilder builder = + new AggregationQueryBuilder(new DefaultExpressionSerializer()); + Pair, OpenSearchAggregationResponseParser> aggregationBuilder = + builder.buildAggregationBuilder(aggregatorList, groupByList, sortList); + indexScan.getRequestBuilder().pushDownAggregation(aggregationBuilder); + indexScan.getRequestBuilder().pushTypeMapping( + builder.buildTypeMapping(aggregatorList, groupByList)); + return indexScan; + } + + @Override + public boolean pushDownAggregation(LogicalAggregation aggregation) { + aggregatorList = aggregation.getAggregatorList(); + groupByList = aggregation.getGroupByList(); + return true; + } + + @Override + public boolean pushDownSort(LogicalSort sort) { + if (!sortByFieldsOnly(sort) || hasAggregatorInSortBy(sort)) { + return false; + } + + sortList = sort.getSortList(); + return true; + } + + private boolean sortByFieldsOnly(LogicalSort sort) { + return sort.getSortList().stream() + .map(sortItem -> sortItem.getRight() instanceof ReferenceExpression) + .reduce(true, Boolean::logicalAnd); + } + + private boolean hasAggregatorInSortBy(LogicalSort sort) { + final Set aggregatorNames = + aggregatorList.stream().map(NamedAggregator::getName).collect(Collectors.toSet()); + for (Pair sortPair : sort.getSortList()) { + if (aggregatorNames.contains(((ReferenceExpression) sortPair.getRight()).getAttr())) { + return true; + } + } + return false; + } +} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java new file mode 100644 index 0000000000..9b34f78d5d --- /dev/null +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -0,0 +1,87 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.opensearch.storage.scan; + +import com.google.common.annotations.VisibleForTesting; +import lombok.EqualsAndHashCode; +import org.opensearch.sql.opensearch.storage.OpenSearchIndexScan; +import org.opensearch.sql.planner.logical.LogicalAggregation; +import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalLimit; +import org.opensearch.sql.planner.logical.LogicalProject; +import org.opensearch.sql.planner.logical.LogicalSort; +import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.TableScanOperator; + +/** + * Table scan builder that builds table scan operator for OpenSearch. The actual work is performed + * by delegated builder internally. This is to avoid conditional check of different push down logic + * for non-aggregate and aggregate query everywhere. + */ +public class OpenSearchIndexScanBuilder extends TableScanBuilder { + + /** + * Delegated index scan builder for non-aggregate or aggregate query. + */ + @EqualsAndHashCode.Include + private TableScanBuilder delegate; + + @VisibleForTesting + OpenSearchIndexScanBuilder(TableScanBuilder delegate) { + this.delegate = delegate; + } + + /** + * Initialize with given index scan. + * + * @param indexScan index scan to optimize + */ + public OpenSearchIndexScanBuilder(OpenSearchIndexScan indexScan) { + this.delegate = new OpenSearchSimpleIndexScanBuilder(indexScan); + } + + @Override + public TableScanOperator build() { + return delegate.build(); + } + + @Override + public boolean pushDownFilter(LogicalFilter filter) { + return delegate.pushDownFilter(filter); + } + + @Override + public boolean pushDownAggregation(LogicalAggregation aggregation) { + // Switch to builder for aggregate query which has different push down logic + // for later filter, sort and limit operator. Change back if unable to push + // down aggregation. + TableScanBuilder oldDelegate = delegate; + delegate = new OpenSearchAggregateIndexScanBuilder( + (OpenSearchIndexScan) delegate.build()); + + if (delegate.pushDownAggregation(aggregation)) { + return true; + } else { + delegate = oldDelegate; + return false; + } + } + + @Override + public boolean pushDownSort(LogicalSort sort) { + return delegate.pushDownSort(sort); + } + + @Override + public boolean pushDownLimit(LogicalLimit limit) { + return delegate.pushDownLimit(limit); + } + + @Override + public boolean pushDownProject(LogicalProject project) { + return delegate.pushDownProject(project); + } +} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java new file mode 100644 index 0000000000..f8450112ed --- /dev/null +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java @@ -0,0 +1,133 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.opensearch.storage.scan; + +import com.google.common.annotations.VisibleForTesting; +import java.util.ArrayList; +import java.util.HashSet; +import java.util.List; +import java.util.Set; +import java.util.stream.Collectors; +import lombok.EqualsAndHashCode; +import org.apache.commons.lang3.tuple.Pair; +import org.opensearch.index.query.QueryBuilder; +import org.opensearch.sql.ast.tree.Sort; +import org.opensearch.sql.expression.Expression; +import org.opensearch.sql.expression.ExpressionNodeVisitor; +import org.opensearch.sql.expression.NamedExpression; +import org.opensearch.sql.expression.ReferenceExpression; +import org.opensearch.sql.opensearch.storage.OpenSearchIndexScan; +import org.opensearch.sql.opensearch.storage.script.filter.FilterQueryBuilder; +import org.opensearch.sql.opensearch.storage.script.sort.SortQueryBuilder; +import org.opensearch.sql.opensearch.storage.serialization.DefaultExpressionSerializer; +import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalLimit; +import org.opensearch.sql.planner.logical.LogicalProject; +import org.opensearch.sql.planner.logical.LogicalSort; +import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.TableScanOperator; + +/** + * Index scan builder for simple non-aggregate query used by + * {@link OpenSearchIndexScanBuilder} internally. + */ +@VisibleForTesting +class OpenSearchSimpleIndexScanBuilder extends TableScanBuilder { + + /** OpenSearch index scan to be optimized. */ + @EqualsAndHashCode.Include + private final OpenSearchIndexScan indexScan; + + /** + * Initialize with given index scan and perform push-down optimization later. + * + * @param indexScan index scan not optimized yet + */ + OpenSearchSimpleIndexScanBuilder(OpenSearchIndexScan indexScan) { + this.indexScan = indexScan; + } + + @Override + public TableScanOperator build() { + return indexScan; + } + + @Override + public boolean pushDownFilter(LogicalFilter filter) { + FilterQueryBuilder queryBuilder = new FilterQueryBuilder( + new DefaultExpressionSerializer()); + QueryBuilder query = queryBuilder.build(filter.getCondition()); + indexScan.getRequestBuilder().pushDown(query); + return true; + } + + @Override + public boolean pushDownSort(LogicalSort sort) { + if (!sortByFieldsOnly(sort)) { + return false; + } + + List> sortList = sort.getSortList(); + final SortQueryBuilder builder = new SortQueryBuilder(); + indexScan.getRequestBuilder().pushDownSort(sortList.stream() + .map(sortItem -> builder.build(sortItem.getValue(), sortItem.getKey())) + .collect(Collectors.toList())); + return true; + } + + @Override + public boolean pushDownLimit(LogicalLimit limit) { + indexScan.getRequestBuilder().pushDownLimit(limit.getLimit(), limit.getOffset()); + return true; + } + + @Override + public boolean pushDownProject(LogicalProject project) { + indexScan.getRequestBuilder().pushDownProjects( + findReferenceExpressions(project.getProjectList())); + + // Return false intentionally to keep the original project operator + return false; + } + + private boolean sortByFieldsOnly(LogicalSort sort) { + return sort.getSortList().stream() + .map(sortItem -> sortItem.getRight() instanceof ReferenceExpression) + .reduce(true, Boolean::logicalAnd); + } + + /** + * Find reference expression from expression. + * @param expressions a list of expression. + * + * @return a list of ReferenceExpression + */ + public static Set findReferenceExpressions( + List expressions) { + Set projectList = new HashSet<>(); + for (NamedExpression namedExpression : expressions) { + projectList.addAll(findReferenceExpression(namedExpression)); + } + return projectList; + } + + /** + * Find reference expression from expression. + * @param expression expression. + * + * @return a list of ReferenceExpression + */ + public static List findReferenceExpression(NamedExpression expression) { + List results = new ArrayList<>(); + expression.accept(new ExpressionNodeVisitor<>() { + @Override + public Object visitReference(ReferenceExpression node, Object context) { + return results.add(node); + } + }, null); + return results; + } +} diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicOptimizerTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicOptimizerTest.java deleted file mode 100644 index 31ad2b2ee3..0000000000 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicOptimizerTest.java +++ /dev/null @@ -1,576 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical; - -import static org.junit.jupiter.api.Assertions.assertEquals; -import static org.opensearch.sql.data.model.ExprValueUtils.integerValue; -import static org.opensearch.sql.data.type.ExprCoreType.DOUBLE; -import static org.opensearch.sql.data.type.ExprCoreType.INTEGER; -import static org.opensearch.sql.data.type.ExprCoreType.LONG; -import static org.opensearch.sql.data.type.ExprCoreType.STRING; -import static org.opensearch.sql.opensearch.utils.Utils.indexScan; -import static org.opensearch.sql.opensearch.utils.Utils.indexScanAgg; -import static org.opensearch.sql.opensearch.utils.Utils.noProjects; -import static org.opensearch.sql.opensearch.utils.Utils.projects; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.aggregation; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.filter; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.limit; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; - -import com.google.common.collect.ImmutableList; -import com.google.common.collect.ImmutableSet; -import org.apache.commons.lang3.tuple.Pair; -import org.junit.jupiter.api.Disabled; -import org.junit.jupiter.api.Test; -import org.junit.jupiter.api.extension.ExtendWith; -import org.mockito.Mock; -import org.mockito.junit.jupiter.MockitoExtension; -import org.opensearch.sql.ast.tree.Sort; -import org.opensearch.sql.expression.DSL; -import org.opensearch.sql.opensearch.utils.Utils; -import org.opensearch.sql.planner.logical.LogicalPlan; -import org.opensearch.sql.planner.optimizer.LogicalPlanOptimizer; -import org.opensearch.sql.storage.Table; - -@ExtendWith(MockitoExtension.class) -class OpenSearchLogicOptimizerTest { - - @Mock - private Table table; - - /** - * SELECT intV as i FROM schema WHERE intV = 1. - */ - @Test - void project_filter_merge_with_relation() { - assertEquals( - project( - indexScan("schema", - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))), - ImmutableSet.of(DSL.ref("intV", INTEGER))), - DSL.named("i", DSL.ref("intV", INTEGER)) - ), - optimize( - project( - filter( - relation("schema", table), - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) - ), - DSL.named("i", DSL.ref("intV", INTEGER))) - ) - ); - } - - /** - * SELECT avg(intV) FROM schema GROUP BY string_value. - */ - @Test - void aggregation_merge_relation() { - assertEquals( - project( - indexScanAgg("schema", ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), - optimize( - project( - aggregation( - relation("schema", table), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))) - ) - ); - } - - /** - * SELECT avg(intV) FROM schema WHERE intV = 1 GROUP BY string_value. - */ - @Test - void aggregation_merge_filter_relation() { - assertEquals( - project( - indexScanAgg("schema", - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), - optimize( - project( - aggregation( - filter( - relation("schema", table), - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) - ), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))) - ) - ); - } - - @Disabled("This test should be enabled once https://github.com/opensearch-project/sql/issues/912 is fixed") - @Test - void aggregation_cant_merge_indexScan_with_project() { - assertEquals( - aggregation( - OpenSearchLogicalIndexScan.builder().relationName("schema") - .filter(DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1)))) - .projectList(ImmutableSet.of(DSL.ref("intV", INTEGER))) - .build(), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - optimize( - aggregation( - OpenSearchLogicalIndexScan.builder().relationName("schema") - .filter(DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1)))) - .projectList( - ImmutableSet.of(DSL.ref("intV", INTEGER))) - .build(), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG)))))) - ); - } - - /** - * Sort - Relation --> IndexScan. - */ - @Test - void sort_merge_with_relation() { - assertEquals( - indexScan("schema", Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER))), - optimize( - sort( - relation("schema", table), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER)) - ) - ) - ); - } - - /** - * Sort - IndexScan --> IndexScan. - */ - @Test - void sort_merge_with_indexScan() { - assertEquals( - indexScan("schema", - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER)), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("longV", LONG))), - optimize( - sort( - indexScan("schema", Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER))), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) - ) - ) - ); - } - - /** - * Sort - Filter - Relation --> IndexScan. - */ - @Test - void sort_filter_merge_with_relation() { - assertEquals( - indexScan("schema", - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) - ), - optimize( - sort( - filter( - relation("schema", table), - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) - ), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) - ) - ) - ); - } - - @Test - void sort_with_expression_cannot_merge_with_relation() { - assertEquals( - sort( - relation("schema", table), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) - ), - optimize( - sort( - relation("schema", table), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) - ) - ) - ); - } - - /** - * SELECT avg(intV) FROM schema GROUP BY stringV ORDER BY stringV. - */ - @Test - void sort_merge_indexagg() { - assertEquals( - project( - indexScanAgg("schema", - ImmutableList.of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING))), - ImmutableList - .of(Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("stringV", STRING)))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), - optimize( - project( - sort( - aggregation( - relation("schema", table), - ImmutableList - .of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("stringV", STRING)) - ), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))) - ) - ); - } - - /** - * SELECT avg(intV) FROM schema GROUP BY stringV ORDER BY stringV. - */ - @Test - void sort_merge_indexagg_nulls_last() { - assertEquals( - project( - indexScanAgg("schema", - ImmutableList.of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING))), - ImmutableList - .of(Pair.of(Sort.SortOption.DEFAULT_DESC, DSL.ref("stringV", STRING)))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), - optimize( - project( - sort( - aggregation( - relation("schema", table), - ImmutableList - .of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - Pair.of(Sort.SortOption.DEFAULT_DESC, DSL.ref("stringV", STRING)) - ), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))) - ) - ); - } - - - /** - * Can't Optimize the following query. - * SELECT avg(intV) FROM schema GROUP BY stringV ORDER BY avg(intV). - */ - @Test - void sort_refer_to_aggregator_should_not_merge_with_indexAgg() { - assertEquals( - sort( - indexScanAgg("schema", - ImmutableList.of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - Pair.of(Sort.SortOption.DEFAULT_DESC, DSL.ref("AVG(intV)", INTEGER)) - ), - optimize( - sort( - indexScanAgg("schema", - ImmutableList.of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - Pair.of(Sort.SortOption.DEFAULT_DESC, DSL.ref("AVG(intV)", INTEGER)) - ) - ) - ); - } - - /** - * SELECT avg(intV) FROM schema GROUP BY stringV ORDER BY stringV ASC NULL_LAST. - */ - @Test - void sort_with_customized_option_should_merge_with_indexAgg() { - assertEquals( - indexScanAgg( - "schema", - ImmutableList.of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING))), - ImmutableList.of( - Pair.of( - new Sort.SortOption(Sort.SortOrder.ASC, Sort.NullOrder.NULL_LAST), - DSL.ref("stringV", STRING)))), - optimize( - sort( - indexScanAgg( - "schema", - ImmutableList.of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - Pair.of( - new Sort.SortOption(Sort.SortOrder.ASC, Sort.NullOrder.NULL_LAST), - DSL.ref("stringV", STRING))))); - } - - @Test - void limit_merge_with_relation() { - assertEquals( - project( - indexScan("schema", 1, 1, projects(DSL.ref("intV", INTEGER))), - DSL.named("intV", DSL.ref("intV", INTEGER)) - ), - optimize( - project( - limit( - relation("schema", table), - 1, 1 - ), - DSL.named("intV", DSL.ref("intV", INTEGER)) - ) - ) - ); - } - - @Test - void limit_merge_with_index_scan() { - assertEquals( - project( - indexScan("schema", - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))), - 1, 1, - projects(DSL.ref("intV", INTEGER)) - ), - DSL.named("intV", DSL.ref("intV", INTEGER)) - ), - optimize( - project( - limit( - filter( - relation("schema", table), - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) - ), 1, 1 - ), - DSL.named("intV", DSL.ref("intV", INTEGER))) - ) - ); - } - - @Test - void limit_merge_with_index_scan_sort() { - assertEquals( - project( - indexScan("schema", - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))), - 1, 1, - Utils.sort(DSL.ref("longV", LONG), Sort.SortOption.DEFAULT_ASC), - projects(DSL.ref("intV", INTEGER)) - ), - DSL.named("intV", DSL.ref("intV", INTEGER)) - ), - optimize( - project( - limit( - sort( - filter( - relation("schema", table), - DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) - ), - Pair.of(Sort.SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) - ), 1, 1 - ), - DSL.named("intV", DSL.ref("intV", INTEGER)) - ) - ) - ); - } - - @Test - void aggregation_cant_merge_index_scan_with_limit() { - assertEquals( - project( - aggregation( - indexScan("schema", 10, 0, noProjects()), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), - optimize( - project( - aggregation( - indexScan("schema", 10, 0, noProjects()), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))))); - } - - @Test - void push_down_projectList_to_relation() { - assertEquals( - project( - indexScan("schema", projects(DSL.ref("intV", INTEGER))), - DSL.named("i", DSL.ref("intV", INTEGER)) - ), - optimize( - project( - relation("schema", table), - DSL.named("i", DSL.ref("intV", INTEGER))) - ) - ); - } - - /** - * Project(intV, abs(intV)) -> Relation. - * -- will be optimized as - * Project(intV, abs(intV)) -> Relation(project=intV). - */ - @Test - void push_down_should_handle_duplication() { - assertEquals( - project( - indexScan("schema", projects(DSL.ref("intV", INTEGER))), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("absi", DSL.abs(DSL.ref("intV", INTEGER))) - ), - optimize( - project( - relation("schema", table), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("absi", DSL.abs(DSL.ref("intV", INTEGER)))) - ) - ); - } - - /** - * Project(ListA) -> Project(ListB) -> Relation. - * -- will be optimized as - * Project(ListA) -> Project(ListB) -> Relation(project=ListB). - */ - @Test - void only_one_project_should_be_push() { - assertEquals( - project( - project( - indexScan("schema", - projects(DSL.ref("intV", INTEGER), DSL.ref("stringV", STRING)) - ), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("s", DSL.ref("stringV", STRING)) - ), - DSL.named("i", DSL.ref("intV", INTEGER)) - ), - optimize( - project( - project( - relation("schema", table), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("s", DSL.ref("stringV", STRING)) - ), - DSL.named("i", DSL.ref("intV", INTEGER)) - ) - ) - ); - } - - @Test - void project_literal_no_push() { - assertEquals( - project( - relation("schema", table), - DSL.named("i", DSL.literal("str")) - ), - optimize( - project( - relation("schema", table), - DSL.named("i", DSL.literal("str")) - ) - ) - ); - } - - /** - * SELECT AVG(intV) FILTER(WHERE intV > 1) FROM schema GROUP BY stringV. - */ - @Test - void filter_aggregation_merge_relation() { - assertEquals( - project( - indexScanAgg("schema", ImmutableList.of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)) - .condition(DSL.greater(DSL.ref("intV", INTEGER), DSL.literal(1))))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - DSL.named("avg(intV) filter(where intV > 1)", DSL.ref("avg(intV)", DOUBLE))), - optimize( - project( - aggregation( - relation("schema", table), - ImmutableList.of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)) - .condition(DSL.greater(DSL.ref("intV", INTEGER), DSL.literal(1))))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - DSL.named("avg(intV) filter(where intV > 1)", DSL.ref("avg(intV)", DOUBLE))) - ) - ); - } - - /** - * SELECT AVG(intV) FILTER(WHERE intV > 1) FROM schema WHERE longV < 1 GROUP BY stringV. - */ - @Test - void filter_aggregation_merge_filter_relation() { - assertEquals( - project( - indexScanAgg("schema", - DSL.less(DSL.ref("longV", LONG), DSL.literal(1)), - ImmutableList.of(DSL.named("avg(intV)", - DSL.avg(DSL.ref("intV", INTEGER)) - .condition(DSL.greater(DSL.ref("intV", INTEGER), DSL.literal(1))))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - DSL.named("avg(intV) filter(where intV > 1)", DSL.ref("avg(intV)", DOUBLE))), - optimize( - project( - aggregation( - filter( - relation("schema", table), - DSL.less(DSL.ref("longV", LONG), DSL.literal(1)) - ), - ImmutableList.of(DSL.named("avg(intV)", - DSL.avg(DSL.ref("intV", INTEGER)) - .condition(DSL.greater(DSL.ref("intV", INTEGER), DSL.literal(1))))), - ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), - DSL.named("avg(intV) filter(where intV > 1)", DSL.ref("avg(intV)", DOUBLE))) - ) - ); - } - - private LogicalPlan optimize(LogicalPlan plan) { - final LogicalPlanOptimizer optimizer = OpenSearchLogicalPlanOptimizerFactory.create(); - final LogicalPlan optimize = optimizer.optimize(plan); - return optimize; - } -} diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScanTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScanTest.java deleted file mode 100644 index 2e10f33787..0000000000 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/planner/logical/OpenSearchLogicalIndexScanTest.java +++ /dev/null @@ -1,24 +0,0 @@ -/* - * Copyright OpenSearch Contributors - * SPDX-License-Identifier: Apache-2.0 - */ - - -package org.opensearch.sql.opensearch.planner.logical; - -import static org.junit.jupiter.api.Assertions.assertFalse; - -import com.google.common.collect.ImmutableSet; -import org.junit.jupiter.api.Test; - -class OpenSearchLogicalIndexScanTest { - - @Test - void has_projects() { - assertFalse(OpenSearchLogicalIndexScan.builder() - .projectList(ImmutableSet.of()).build() - .hasProjects()); - - assertFalse(OpenSearchLogicalIndexScan.builder().build().hasProjects()); - } -} diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java index a74c5fcbd4..dc8fb9d4cf 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java @@ -31,41 +31,20 @@ @ExtendWith(MockitoExtension.class) public class OpenSearchDefaultImplementorTest { - @Mock - OpenSearchIndexScan indexScan; @Mock OpenSearchClient client; @Mock Table table; - /** - * For test coverage. - */ - @Test - public void visitInvalidTypeShouldThrowException() { - final OpenSearchIndex.OpenSearchDefaultImplementor implementor = - new OpenSearchIndex.OpenSearchDefaultImplementor(indexScan, client); - - final IllegalStateException exception = - assertThrows(IllegalStateException.class, - () -> implementor.visitNode(relation("index", table), - indexScan)); - ; - assertEquals( - "unexpected plan node type " - + "class org.opensearch.sql.planner.logical.LogicalRelation", - exception.getMessage()); - } - @Test public void visitMachineLearning() { LogicalMLCommons node = Mockito.mock(LogicalMLCommons.class, Answers.RETURNS_DEEP_STUBS); Mockito.when(node.getChild().get(0)).thenReturn(Mockito.mock(LogicalPlan.class)); OpenSearchIndex.OpenSearchDefaultImplementor implementor = - new OpenSearchIndex.OpenSearchDefaultImplementor(indexScan, client); - assertNotNull(implementor.visitMLCommons(node, indexScan)); + new OpenSearchIndex.OpenSearchDefaultImplementor(client); + assertNotNull(implementor.visitMLCommons(node, null)); } @Test @@ -74,8 +53,8 @@ public void visitAD() { Answers.RETURNS_DEEP_STUBS); Mockito.when(node.getChild().get(0)).thenReturn(Mockito.mock(LogicalPlan.class)); OpenSearchIndex.OpenSearchDefaultImplementor implementor = - new OpenSearchIndex.OpenSearchDefaultImplementor(indexScan, client); - assertNotNull(implementor.visitAD(node, indexScan)); + new OpenSearchIndex.OpenSearchDefaultImplementor(client); + assertNotNull(implementor.visitAD(node, null)); } @Test @@ -84,8 +63,8 @@ public void visitML() { Answers.RETURNS_DEEP_STUBS); Mockito.when(node.getChild().get(0)).thenReturn(Mockito.mock(LogicalPlan.class)); OpenSearchIndex.OpenSearchDefaultImplementor implementor = - new OpenSearchIndex.OpenSearchDefaultImplementor(indexScan, client); - assertNotNull(implementor.visitML(node, indexScan)); + new OpenSearchIndex.OpenSearchDefaultImplementor(client); + assertNotNull(implementor.visitML(node, null)); } @Test @@ -93,10 +72,11 @@ public void visitHighlight() { LogicalHighlight node = Mockito.mock(LogicalHighlight.class, Answers.RETURNS_DEEP_STUBS); Mockito.when(node.getChild().get(0)).thenReturn(Mockito.mock(LogicalPlan.class)); + OpenSearchIndexScan indexScan = Mockito.mock(OpenSearchIndexScan.class); OpenSearchRequestBuilder requestBuilder = Mockito.mock(OpenSearchRequestBuilder.class); Mockito.when(indexScan.getRequestBuilder()).thenReturn(requestBuilder); OpenSearchIndex.OpenSearchDefaultImplementor implementor = - new OpenSearchIndex.OpenSearchDefaultImplementor(indexScan, client); + new OpenSearchIndex.OpenSearchDefaultImplementor(client); implementor.visitHighlight(node, indexScan); verify(requestBuilder).pushDownHighlight(any(), any()); diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java index 9e375aa1b0..f432d64dcc 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java @@ -9,8 +9,6 @@ import static org.hamcrest.MatcherAssert.assertThat; import static org.hamcrest.Matchers.aMapWithSize; import static org.hamcrest.Matchers.allOf; -import static org.hamcrest.Matchers.arrayContaining; -import static org.hamcrest.Matchers.emptyArray; import static org.hamcrest.Matchers.hasEntry; import static org.junit.jupiter.api.Assertions.assertEquals; import static org.junit.jupiter.api.Assertions.assertTrue; @@ -23,14 +21,7 @@ import static org.opensearch.sql.expression.DSL.named; import static org.opensearch.sql.expression.DSL.ref; import static org.opensearch.sql.opensearch.data.type.OpenSearchDataType.OPENSEARCH_TEXT_KEYWORD; -import static org.opensearch.sql.opensearch.utils.Utils.indexScan; -import static org.opensearch.sql.opensearch.utils.Utils.indexScanAgg; -import static org.opensearch.sql.opensearch.utils.Utils.noProjects; -import static org.opensearch.sql.opensearch.utils.Utils.projects; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.aggregation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.eval; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.filter; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.limit; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.remove; @@ -49,13 +40,11 @@ import org.junit.jupiter.api.extension.ExtendWith; import org.mockito.Mock; import org.mockito.junit.jupiter.MockitoExtension; -import org.opensearch.search.fetch.subphase.FetchSourceContext; import org.opensearch.sql.ast.tree.Sort; import org.opensearch.sql.common.setting.Settings; import org.opensearch.sql.data.model.ExprBooleanValue; import org.opensearch.sql.data.type.ExprCoreType; import org.opensearch.sql.data.type.ExprType; -import org.opensearch.sql.expression.DSL; import org.opensearch.sql.expression.Expression; import org.opensearch.sql.expression.NamedExpression; import org.opensearch.sql.expression.ReferenceExpression; @@ -67,12 +56,7 @@ import org.opensearch.sql.opensearch.mapping.IndexMapping; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.logical.LogicalPlanDSL; -import org.opensearch.sql.planner.physical.AggregationOperator; -import org.opensearch.sql.planner.physical.FilterOperator; -import org.opensearch.sql.planner.physical.LimitOperator; -import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.planner.physical.PhysicalPlanDSL; -import org.opensearch.sql.planner.physical.ProjectOperator; import org.opensearch.sql.storage.Table; @ExtendWith(MockitoExtension.class) @@ -170,7 +154,7 @@ void implementRelationOperatorOnly() { when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - LogicalPlan plan = relation(indexName, table); + LogicalPlan plan = index.createScanBuilder(); Integer maxResultWindow = index.getMaxResultWindow(); assertEquals( new OpenSearchIndexScan(client, settings, indexName, maxResultWindow, exprValueFactory), @@ -182,7 +166,7 @@ void implementRelationOperatorWithOptimization() { when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - LogicalPlan plan = relation(indexName, table); + LogicalPlan plan = index.createScanBuilder(); Integer maxResultWindow = index.getMaxResultWindow(); assertEquals( new OpenSearchIndexScan(client, settings, indexName, maxResultWindow, exprValueFactory), @@ -217,7 +201,7 @@ void implementOtherLogicalOperators() { eval( remove( rename( - relation(indexName, table), + index.createScanBuilder(), mappings), exclude), newEvalField), @@ -243,214 +227,4 @@ void implementOtherLogicalOperators() { include), index.implement(plan)); } - - @Test - void shouldImplLogicalIndexScan() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - NamedExpression named = named("n", field); - Expression filterExpr = DSL.equal(field, literal("John")); - - PhysicalPlan plan = index.implement( - project( - indexScan( - indexName, - filterExpr - ), - named)); - - assertTrue(plan instanceof ProjectOperator); - assertTrue(((ProjectOperator) plan).getInput() instanceof OpenSearchIndexScan); - } - - @Test - void shouldNotPushDownFilterFarFromRelation() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - Expression filterExpr = DSL.equal(field, literal("John")); - List groupByExprs = Arrays.asList(named("age", ref("age", INTEGER))); - List aggregators = - Arrays.asList(named("avg(age)", new AvgAggregator(Arrays.asList(ref("age", INTEGER)), - DOUBLE))); - - PhysicalPlan plan = index.implement( - filter( - aggregation( - relation(indexName, table), - aggregators, - groupByExprs - ), - filterExpr)); - - assertTrue(plan instanceof FilterOperator); - } - - @Test - void shouldImplLogicalIndexScanAgg() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - Expression filterExpr = DSL.equal(field, literal("John")); - List groupByExprs = Arrays.asList(named("age", ref("age", INTEGER))); - List aggregators = - Arrays.asList(named("avg(age)", new AvgAggregator(Arrays.asList(ref("age", INTEGER)), - DOUBLE))); - - // IndexScanAgg without Filter - PhysicalPlan plan = index.implement( - filter( - indexScanAgg( - indexName, - aggregators, - groupByExprs - ), - filterExpr)); - - assertTrue(plan.getChild().get(0) instanceof OpenSearchIndexScan); - - // IndexScanAgg with Filter - plan = index.implement( - indexScanAgg( - indexName, - filterExpr, - aggregators, - groupByExprs)); - assertTrue(plan instanceof OpenSearchIndexScan); - } - - @Test - void shouldNotPushDownAggregationFarFromRelation() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - Expression filterExpr = DSL.equal(field, literal("John")); - List groupByExprs = Arrays.asList(named("age", ref("age", INTEGER))); - List aggregators = - Arrays.asList(named("avg(age)", new AvgAggregator(Arrays.asList(ref("age", INTEGER)), - DOUBLE))); - - PhysicalPlan plan = index.implement( - aggregation( - filter(filter( - relation(indexName, table), - filterExpr), filterExpr), - aggregators, - groupByExprs)); - assertTrue(plan instanceof AggregationOperator); - } - - @Test - void shouldImplIndexScanWithSort() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - NamedExpression named = named("n", field); - Expression sortExpr = ref("name", STRING); - - PhysicalPlan plan = index.implement( - project( - indexScan( - indexName, - Pair.of(Sort.SortOption.DEFAULT_ASC, sortExpr) - ), - named)); - - assertTrue(plan instanceof ProjectOperator); - assertTrue(((ProjectOperator) plan).getInput() instanceof OpenSearchIndexScan); - } - - @Test - void shouldImplIndexScanWithLimit() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - NamedExpression named = named("n", field); - - PhysicalPlan plan = index.implement( - project( - indexScan( - indexName, - 1, 1, noProjects() - ), - named)); - - assertTrue(plan instanceof ProjectOperator); - assertTrue(((ProjectOperator) plan).getInput() instanceof OpenSearchIndexScan); - } - - @Test - void shouldImplIndexScanWithSortAndLimit() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - ReferenceExpression field = ref("name", STRING); - NamedExpression named = named("n", field); - Expression sortExpr = ref("name", STRING); - - PhysicalPlan plan = index.implement( - project( - indexScan( - indexName, - sortExpr, - 1, 1, - noProjects() - ), - named)); - - assertTrue(plan instanceof ProjectOperator); - assertTrue(((ProjectOperator) plan).getInput() instanceof OpenSearchIndexScan); - } - - @Test - void shouldNotPushDownLimitFarFromRelationButUpdateScanSize() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - PhysicalPlan plan = index.implement(index.optimize( - project( - limit( - sort( - relation("test", table), - Pair.of(Sort.SortOption.DEFAULT_ASC, - DSL.abs(named("intV", ref("intV", INTEGER)))) - ), - 300, 1 - ), - named("intV", ref("intV", INTEGER)) - ) - )); - - assertTrue(plan instanceof ProjectOperator); - assertTrue(((ProjectOperator) plan).getInput() instanceof LimitOperator); - } - - @Test - void shouldPushDownProjects() { - when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); - when(client.getIndexMaxResultWindows("test")).thenReturn(Map.of("test", 10000)); - - PhysicalPlan plan = index.implement( - project( - indexScan( - indexName, projects(ref("intV", INTEGER)) - ), - named("i", ref("intV", INTEGER)))); - - assertTrue(plan instanceof ProjectOperator); - assertTrue(((ProjectOperator) plan).getInput() instanceof OpenSearchIndexScan); - - final FetchSourceContext fetchSource = - ((OpenSearchIndexScan) ((ProjectOperator) plan).getInput()).getRequestBuilder() - .getSourceBuilder().fetchSource(); - assertThat(fetchSource.includes(), arrayContaining("intV")); - assertThat(fetchSource.excludes(), emptyArray()); - } } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java new file mode 100644 index 0000000000..152b1ef1de --- /dev/null +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -0,0 +1,584 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + + +package org.opensearch.sql.opensearch.storage.scan; + +import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.mockito.Mockito.reset; +import static org.mockito.Mockito.times; +import static org.mockito.Mockito.verify; +import static org.mockito.Mockito.when; +import static org.opensearch.sql.ast.tree.Sort.NullOrder.NULL_FIRST; +import static org.opensearch.sql.ast.tree.Sort.SortOrder.ASC; +import static org.opensearch.sql.data.model.ExprValueUtils.integerValue; +import static org.opensearch.sql.data.type.ExprCoreType.DOUBLE; +import static org.opensearch.sql.data.type.ExprCoreType.INTEGER; +import static org.opensearch.sql.data.type.ExprCoreType.LONG; +import static org.opensearch.sql.data.type.ExprCoreType.STRING; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.aggregation; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.filter; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.limit; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_AGGREGATION; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_FILTER; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_LIMIT; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_PROJECT; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_SORT; + +import com.google.common.collect.ImmutableList; +import java.util.Arrays; +import java.util.Collections; +import java.util.HashSet; +import java.util.List; +import java.util.Map; +import lombok.Builder; +import org.apache.commons.lang3.tuple.Pair; +import org.junit.jupiter.api.BeforeEach; +import org.junit.jupiter.api.Test; +import org.junit.jupiter.api.extension.ExtendWith; +import org.mockito.Mock; +import org.mockito.junit.jupiter.MockitoExtension; +import org.opensearch.index.query.QueryBuilder; +import org.opensearch.index.query.QueryBuilders; +import org.opensearch.search.aggregations.AggregationBuilder; +import org.opensearch.search.aggregations.AggregationBuilders; +import org.opensearch.search.aggregations.bucket.composite.CompositeAggregationBuilder; +import org.opensearch.search.aggregations.bucket.composite.TermsValuesSourceBuilder; +import org.opensearch.search.sort.SortBuilder; +import org.opensearch.search.sort.SortBuilders; +import org.opensearch.search.sort.SortOrder; +import org.opensearch.sql.ast.tree.Sort.SortOption; +import org.opensearch.sql.data.type.ExprType; +import org.opensearch.sql.expression.DSL; +import org.opensearch.sql.expression.ReferenceExpression; +import org.opensearch.sql.opensearch.request.OpenSearchRequestBuilder; +import org.opensearch.sql.opensearch.response.agg.CompositeAggregationParser; +import org.opensearch.sql.opensearch.response.agg.OpenSearchAggregationResponseParser; +import org.opensearch.sql.opensearch.response.agg.SingleValueParser; +import org.opensearch.sql.opensearch.storage.OpenSearchIndexScan; +import org.opensearch.sql.opensearch.storage.script.aggregation.AggregationQueryBuilder; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.optimizer.LogicalPlanOptimizer; +import org.opensearch.sql.planner.optimizer.rule.scan.CreateTableScanBuilder; +import org.opensearch.sql.storage.Table; + + +@ExtendWith(MockitoExtension.class) +class OpenSearchIndexScanOptimizationTest { + + @Mock + private Table table; + + @Mock + private OpenSearchIndexScan indexScan; + + private OpenSearchIndexScanBuilder indexScanBuilder; + + @Mock + private OpenSearchRequestBuilder requestBuilder; + + private Runnable[] verifyPushDownCalls = {}; + + @BeforeEach + void setUp() { + indexScanBuilder = new OpenSearchIndexScanBuilder(indexScan); + when(table.createScanBuilder()).thenReturn(indexScanBuilder); + when(indexScan.getRequestBuilder()).thenReturn(requestBuilder); + } + + @Test + void test_project_push_down() { + assertEqualsAfterOptimization( + project( + indexScanAggBuilder( + withProjectPushedDown(DSL.ref("intV", INTEGER))), + DSL.named("i", DSL.ref("intV", INTEGER)) + ), + project( + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER))) + ); + } + + /** + * SELECT intV as i FROM schema WHERE intV = 1. + */ + @Test + void test_filter_push_down() { + assertEqualsAfterOptimization( + project( + indexScanBuilder( + //withProjectPushedDown(DSL.ref("intV", INTEGER)), + withFilterPushedDown(QueryBuilders.termQuery("intV", 1)) + ), + DSL.named("i", DSL.ref("intV", INTEGER)) + ), + project( + filter( + relation("schema", table), + DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) + ), + DSL.named("i", DSL.ref("intV", INTEGER)) + ) + ); + } + + /** + * SELECT avg(intV) FROM schema GROUP BY string_value. + */ + @Test + void test_aggregation_push_down() { + assertEqualsAfterOptimization( + project( + indexScanAggBuilder( + withAggregationPushedDown( + aggregate("AVG(intV)") + .aggregateBy("intV") + .groupBy("longV") + .resultTypes(Map.of( + "AVG(intV)", DOUBLE, + "longV", LONG)))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), + project( + aggregation( + relation("schema", table), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", DSL.ref("longV", LONG)))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE)) + ) + ); + } + + /* + @Disabled("This test should be enabled once https://github.com/opensearch-project/sql/issues/912 is fixed") + @Test + void aggregation_cant_merge_indexScan_with_project() { + assertEquals( + aggregation( + OpenSearchLogicalIndexScan.builder().relationName("schema") + .filter(DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1)))) + .projectList(ImmutableSet.of(DSL.ref("intV", INTEGER))) + .build(), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", + DSL.abs(DSL.ref("longV", LONG))))), + optimize( + aggregation( + OpenSearchLogicalIndexScan.builder().relationName("schema") + .filter(DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1)))) + .projectList( + ImmutableSet.of(DSL.ref("intV", INTEGER))) + .build(), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", + DSL.abs(DSL.ref("longV", LONG)))))) + ); + } + */ + + /** + * Sort - Relation --> IndexScan. + */ + @Test + void test_sort_push_down() { + assertEqualsAfterOptimization( + indexScanBuilder( + withSortPushedDown( + SortBuilders.fieldSort("intV").order(SortOrder.ASC).missing("_first")) + ), + sort( + relation("schema", table), + Pair.of(SortOption.DEFAULT_ASC, DSL.ref("intV", INTEGER)) + ) + ); + } + + @Test + void test_limit_push_down() { + assertEqualsAfterOptimization( + project( + indexScanBuilder( + withLimitPushedDown(1, 1)), + DSL.named("intV", DSL.ref("intV", INTEGER)) + ), + project( + limit( + relation("schema", table), + 1, 1), + DSL.named("intV", DSL.ref("intV", INTEGER)) + ) + ); + } + + /** + * SELECT avg(intV) FROM schema WHERE intV = 1 GROUP BY string_value. + */ + @Test + void test_aggregation_filter_push_down() { + assertEqualsAfterOptimization( + project( + indexScanAggBuilder( + withFilterPushedDown(QueryBuilders.termQuery("intV", 1)), + withAggregationPushedDown( + aggregate("AVG(intV)") + .aggregateBy("intV") + .groupBy("longV") + .resultTypes(Map.of( + "AVG(intV)", DOUBLE, + "longV", LONG)))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE)) + ), + project( + aggregation( + filter( + relation("schema", table), + DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) + ), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", DSL.ref("longV", LONG)))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE)) + ) + ); + } + + /** + * Sort - Filter - Relation --> IndexScan. + */ + @Test + void test_sort_filter_push_down() { + assertEqualsAfterOptimization( + indexScanBuilder( + withFilterPushedDown(QueryBuilders.termQuery("intV", 1)), + withSortPushedDown( + SortBuilders.fieldSort("longV").order(SortOrder.ASC).missing("_first")) + ), + sort( + filter( + relation("schema", table), + DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) + ), + Pair.of(SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) + ) + ); + } + + /** + * SELECT avg(intV) FROM schema GROUP BY stringV ORDER BY stringV. + */ + @Test + void test_sort_aggregation_push_down() { + assertEqualsAfterOptimization( + project( + indexScanAggBuilder( + withAggregationPushedDown( + aggregate("AVG(intV)") + .aggregateBy("intV") + .groupBy("stringV") + .sortBy(SortOption.DEFAULT_DESC) + .resultTypes(Map.of( + "AVG(intV)", DOUBLE, + "stringV", STRING)))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), + project( + sort( + aggregation( + relation("schema", table), + ImmutableList + .of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), + Pair.of(SortOption.DEFAULT_DESC, DSL.ref("stringV", STRING)) + ), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE)) + ) + ); + } + + @Test + void test_limit_sort_filter_push_down() { + assertEqualsAfterOptimization( + project( + indexScanBuilder( + withFilterPushedDown(QueryBuilders.termQuery("intV", 1)), + withSortPushedDown( + SortBuilders.fieldSort("longV").order(SortOrder.ASC).missing("_first")), + withLimitPushedDown(1, 1)), + DSL.named("intV", DSL.ref("intV", INTEGER)) + ), + project( + limit( + sort( + filter( + relation("schema", table), + DSL.equal(DSL.ref("intV", INTEGER), DSL.literal(integerValue(1))) + ), + Pair.of(SortOption.DEFAULT_ASC, DSL.ref("longV", LONG)) + ), 1, 1 + ), + DSL.named("intV", DSL.ref("intV", INTEGER)) + ) + ); + } + + /* + @Test + void aggregation_cant_merge_index_scan_with_limit() { + assertEquals( + project( + aggregation( + indexScan("schema", 10, 0, noProjects()), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", + DSL.abs(DSL.ref("longV", LONG))))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), + optimize( + project( + aggregation( + indexScan("schema", 10, 0, noProjects()), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", + DSL.abs(DSL.ref("longV", LONG))))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))))); + } + */ + + /** + * Project(intV, abs(intV)) -> Relation. + * -- will be optimized as + * Project(intV, abs(intV)) -> Relation(project=intV). + */ + /* + @Test + void push_down_should_handle_duplication() { + assertEquals( + project( + indexScan("schema", projects(DSL.ref("intV", INTEGER))), + DSL.named("i", DSL.ref("intV", INTEGER)), + DSL.named("absi", DSL.abs(DSL.ref("intV", INTEGER))) + ), + optimize( + project( + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER)), + DSL.named("absi", DSL.abs(DSL.ref("intV", INTEGER)))) + ) + ); + } + */ + + /* + * Project(ListA) -> Project(ListB) -> Relation. + * -- will be optimized as + * Project(ListA) -> Project(ListB) -> Relation(project=ListB). + */ + /* + @Test + void only_one_project_should_be_push() { + assertEquals( + project( + project( + indexScan("schema", + projects(DSL.ref("intV", INTEGER), DSL.ref("stringV", STRING)) + ), + DSL.named("i", DSL.ref("intV", INTEGER)), + DSL.named("s", DSL.ref("stringV", STRING)) + ), + DSL.named("i", DSL.ref("intV", INTEGER)) + ), + optimize( + project( + project( + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER)), + DSL.named("s", DSL.ref("stringV", STRING)) + ), + DSL.named("i", DSL.ref("intV", INTEGER)) + ) + ) + ); + } + */ + + @Test + void sort_with_expression_cannot_merge_with_relation() { + assertEqualsAfterOptimization( + sort( + indexScanAggBuilder(), + Pair.of(SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) + ), + sort( + relation("schema", table), + Pair.of(SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) + ) + ); + } + + + /** + * Can't Optimize the following query. + * SELECT avg(intV) FROM schema GROUP BY stringV ORDER BY avg(intV). + */ + @Test + void sort_refer_to_aggregator_should_not_merge_with_indexAgg() { + assertEqualsAfterOptimization( + project( + sort( + indexScanAggBuilder( + withAggregationPushedDown( + aggregate("AVG(intV)") + .aggregateBy("intV") + .groupBy("stringV") + .resultTypes(Map.of( + "AVG(intV)", DOUBLE, + "stringV", STRING)))), + Pair.of(SortOption.DEFAULT_ASC, DSL.ref("AVG(intV)", INTEGER)) + ), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), + project( + sort( + aggregation( + relation("schema", table), + ImmutableList + .of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), + Pair.of(SortOption.DEFAULT_ASC, DSL.ref("AVG(intV)", INTEGER)) + ), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE)) + ) + ); + } + + @Test + void project_literal_no_push() { + assertEqualsAfterOptimization( + project( + indexScanBuilder(), + DSL.named("i", DSL.literal("str")) + ), + optimize( + project( + relation("schema", table), + DSL.named("i", DSL.literal("str")) + ) + ) + ); + } + + private OpenSearchIndexScanBuilder indexScanBuilder(Runnable... verifyPushDownCalls) { + this.verifyPushDownCalls = verifyPushDownCalls; + return new OpenSearchIndexScanBuilder(new OpenSearchSimpleIndexScanBuilder(indexScan)); + } + + private OpenSearchIndexScanBuilder indexScanAggBuilder(Runnable... verifyPushDownCalls) { + this.verifyPushDownCalls = verifyPushDownCalls; + return new OpenSearchIndexScanBuilder(new OpenSearchAggregateIndexScanBuilder(indexScan)); + } + + private void assertEqualsAfterOptimization(LogicalPlan expected, LogicalPlan actual) { + assertEquals(expected, optimize(actual)); + + // Trigger build to make sure all push down actually happened in scan builder + indexScanBuilder.build(); + + // Verify to make sure all push down methods are called as expected + if (verifyPushDownCalls.length == 0) { + reset(indexScan); + } else { + Arrays.stream(verifyPushDownCalls).forEach(Runnable::run); + } + } + + private Runnable withFilterPushedDown(QueryBuilder filteringCondition) { + return () -> verify(requestBuilder, times(1)).pushDown(filteringCondition); + } + + private Runnable withAggregationPushedDown( + AggregationAssertHelper.AggregationAssertHelperBuilder aggregation) { + + // Assume single term bucket and AVG metric in all tests in this suite + CompositeAggregationBuilder aggBuilder = AggregationBuilders.composite( + "composite_buckets", + Collections.singletonList( + new TermsValuesSourceBuilder(aggregation.groupBy) + .field(aggregation.groupBy) + .order(aggregation.sortBy.getSortOrder() == ASC ? "asc" : "desc") + .missingOrder(aggregation.sortBy.getNullOrder() == NULL_FIRST ? "first" : "last") + .missingBucket(true))) + .subAggregation( + AggregationBuilders.avg(aggregation.aggregateName) + .field(aggregation.aggregateBy)) + .size(AggregationQueryBuilder.AGGREGATION_BUCKET_SIZE); + + List aggBuilders = Collections.singletonList(aggBuilder); + OpenSearchAggregationResponseParser responseParser = + new CompositeAggregationParser( + new SingleValueParser(aggregation.aggregateName)); + + return () -> { + verify(requestBuilder, times(1)).pushDownAggregation(Pair.of(aggBuilders, responseParser)); + verify(requestBuilder, times(1)).pushTypeMapping(aggregation.resultTypes); + }; + } + + private Runnable withSortPushedDown(SortBuilder... sorts) { + return () -> verify(requestBuilder, times(1)).pushDownSort(Arrays.asList(sorts)); + } + + private Runnable withLimitPushedDown(int size, int offset) { + return () -> verify(requestBuilder, times(1)).pushDownLimit(size, offset); + } + + private Runnable withProjectPushedDown(ReferenceExpression... references) { + return () -> verify(requestBuilder, times(1)).pushDownProjects( + new HashSet<>(Arrays.asList(references))); + } + + private static AggregationAssertHelper.AggregationAssertHelperBuilder aggregate(String aggName) { + var aggBuilder = new AggregationAssertHelper.AggregationAssertHelperBuilder(); + aggBuilder.aggregateName = aggName; + aggBuilder.sortBy = SortOption.DEFAULT_ASC; + return aggBuilder; + } + + /** Assertion helper for readability. */ + @Builder + private static class AggregationAssertHelper { + + String aggregateName; + + String aggregateBy; + + String groupBy; + + SortOption sortBy; + + Map resultTypes; + } + + private LogicalPlan optimize(LogicalPlan plan) { + LogicalPlanOptimizer optimizer = new LogicalPlanOptimizer(List.of( + new CreateTableScanBuilder(), + PUSH_DOWN_FILTER, + PUSH_DOWN_AGGREGATION, + PUSH_DOWN_SORT, + PUSH_DOWN_LIMIT, + PUSH_DOWN_PROJECT)); + return optimizer.optimize(plan); + } +} diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/utils/Utils.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/utils/Utils.java index 2ed9a16434..85b8889de3 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/utils/Utils.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/utils/Utils.java @@ -20,141 +20,10 @@ import org.opensearch.sql.expression.ReferenceExpression; import org.opensearch.sql.expression.aggregation.AvgAggregator; import org.opensearch.sql.expression.aggregation.NamedAggregator; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexAgg; -import org.opensearch.sql.opensearch.planner.logical.OpenSearchLogicalIndexScan; -import org.opensearch.sql.planner.logical.LogicalPlan; @UtilityClass public class Utils { - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, Expression filter) { - return OpenSearchLogicalIndexScan.builder().relationName(tableName) - .filter(filter) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, - Pair... sorts) { - return OpenSearchLogicalIndexScan.builder().relationName(tableName) - .sortList(Arrays.asList(sorts)) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, - Expression filter, - Pair... sorts) { - return OpenSearchLogicalIndexScan.builder().relationName(tableName) - .filter(filter) - .sortList(Arrays.asList(sorts)) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, Integer offset, Integer limit, - Set projectList) { - return OpenSearchLogicalIndexScan.builder().relationName(tableName) - .offset(offset) - .limit(limit) - .projectList(projectList) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, - Expression filter, - Integer offset, Integer limit, - Set projectList) { - return OpenSearchLogicalIndexScan.builder().relationName(tableName) - .filter(filter) - .offset(offset) - .limit(limit) - .projectList(projectList) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, - Expression filter, - Integer offset, Integer limit, - List> sorts, - Set projectList) { - return OpenSearchLogicalIndexScan.builder().relationName(tableName) - .filter(filter) - .sortList(sorts) - .offset(offset) - .limit(limit) - .projectList(projectList) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, - Set projects) { - return OpenSearchLogicalIndexScan.builder() - .relationName(tableName) - .projectList(projects) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexScan. - */ - public static LogicalPlan indexScan(String tableName, Expression filter, - Set projects) { - return OpenSearchLogicalIndexScan.builder() - .relationName(tableName) - .filter(filter) - .projectList(projects) - .build(); - } - - /** - * Build ElasticsearchLogicalIndexAgg. - */ - public static LogicalPlan indexScanAgg(String tableName, List aggregators, - List groupByList) { - return OpenSearchLogicalIndexAgg.builder().relationName(tableName) - .aggregatorList(aggregators).groupByList(groupByList).build(); - } - - /** - * Build ElasticsearchLogicalIndexAgg. - */ - public static LogicalPlan indexScanAgg(String tableName, List aggregators, - List groupByList, - List> sortList) { - return OpenSearchLogicalIndexAgg.builder().relationName(tableName) - .aggregatorList(aggregators).groupByList(groupByList).sortList(sortList).build(); - } - - /** - * Build ElasticsearchLogicalIndexAgg. - */ - public static LogicalPlan indexScanAgg(String tableName, - Expression filter, - List aggregators, - List groupByList) { - return OpenSearchLogicalIndexAgg.builder().relationName(tableName).filter(filter) - .aggregatorList(aggregators).groupByList(groupByList).build(); - } - public static AvgAggregator avg(Expression expr, ExprCoreType type) { return new AvgAggregator(Arrays.asList(expr), type); } From 24d4a6babd343388139c5e18b9e31d5247daeb66 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 09:40:01 -0800 Subject: [PATCH 02/16] Fix jacoco test coverage Signed-off-by: Chen Dai --- .../scan/OpenSearchIndexScanBuilder.java | 18 +-- .../request/OpenSearchRequestBuilderTest.java | 108 +++++++++++++++--- .../storage/OpenSearchIndexTest.java | 41 ++++--- .../OpenSearchIndexScanOptimizationTest.java | 78 ++++++++----- 4 files changed, 175 insertions(+), 70 deletions(-) diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java index 9b34f78d5d..b7eec84e09 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -29,6 +29,8 @@ public class OpenSearchIndexScanBuilder extends TableScanBuilder { @EqualsAndHashCode.Include private TableScanBuilder delegate; + private boolean hasLimit = false; + @VisibleForTesting OpenSearchIndexScanBuilder(TableScanBuilder delegate) { this.delegate = delegate; @@ -55,19 +57,16 @@ public boolean pushDownFilter(LogicalFilter filter) { @Override public boolean pushDownAggregation(LogicalAggregation aggregation) { + if (hasLimit) { + return false; + } + // Switch to builder for aggregate query which has different push down logic - // for later filter, sort and limit operator. Change back if unable to push - // down aggregation. - TableScanBuilder oldDelegate = delegate; + // for later filter, sort and limit operator. delegate = new OpenSearchAggregateIndexScanBuilder( (OpenSearchIndexScan) delegate.build()); - if (delegate.pushDownAggregation(aggregation)) { - return true; - } else { - delegate = oldDelegate; - return false; - } + return delegate.pushDownAggregation(aggregation); } @Override @@ -77,6 +76,7 @@ public boolean pushDownSort(LogicalSort sort) { @Override public boolean pushDownLimit(LogicalLimit limit) { + hasLimit = true; return delegate.pushDownLimit(limit); } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java index 43b9353190..31bfd8ee26 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java @@ -7,41 +7,65 @@ package org.opensearch.sql.opensearch.request; import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.mockito.Mockito.verify; import static org.mockito.Mockito.when; +import static org.opensearch.sql.data.type.ExprCoreType.INTEGER; +import java.util.Collections; +import java.util.List; +import java.util.Map; +import java.util.Set; +import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; import org.junit.jupiter.api.Test; import org.junit.jupiter.api.extension.ExtendWith; import org.mockito.Mock; import org.mockito.junit.jupiter.MockitoExtension; import org.opensearch.common.unit.TimeValue; +import org.opensearch.search.aggregations.AggregationBuilder; +import org.opensearch.search.aggregations.AggregationBuilders; +import org.opensearch.search.aggregations.bucket.composite.TermsValuesSourceBuilder; import org.opensearch.search.builder.SearchSourceBuilder; +import org.opensearch.search.sort.FieldSortBuilder; +import org.opensearch.search.sort.SortBuilders; import org.opensearch.sql.common.setting.Settings; +import org.opensearch.sql.data.type.ExprType; +import org.opensearch.sql.expression.DSL; +import org.opensearch.sql.expression.ReferenceExpression; import org.opensearch.sql.opensearch.data.value.OpenSearchExprValueFactory; +import org.opensearch.sql.opensearch.response.agg.CompositeAggregationParser; +import org.opensearch.sql.opensearch.response.agg.OpenSearchAggregationResponseParser; +import org.opensearch.sql.opensearch.response.agg.SingleValueParser; @ExtendWith(MockitoExtension.class) public class OpenSearchRequestBuilderTest { - public static final TimeValue DEFAULT_QUERY_TIMEOUT = TimeValue.timeValueMinutes(1L); + private static final TimeValue DEFAULT_QUERY_TIMEOUT = TimeValue.timeValueMinutes(1L); + private static final Integer DEFAULT_OFFSET = 0; + private static final Integer DEFAULT_LIMIT = 200; + private static final Integer MAX_RESULT_WINDOW = 500; + @Mock private Settings settings; @Mock - private OpenSearchExprValueFactory factory; + private OpenSearchExprValueFactory exprValueFactory; + + private OpenSearchRequestBuilder requestBuilder; @BeforeEach void setup() { when(settings.getSettingValue(Settings.Key.QUERY_SIZE_LIMIT)).thenReturn(200); + + requestBuilder = new OpenSearchRequestBuilder( + "test", MAX_RESULT_WINDOW, settings, exprValueFactory); } @Test void buildQueryRequest() { - Integer maxResultWindow = 500; Integer limit = 200; Integer offset = 0; - OpenSearchRequestBuilder builder = - new OpenSearchRequestBuilder("test", maxResultWindow, settings, factory); - builder.pushDownLimit(limit, offset); + requestBuilder.pushDownLimit(limit, offset); assertEquals( new OpenSearchQueryRequest( @@ -50,27 +74,81 @@ void buildQueryRequest() { .from(offset) .size(limit) .timeout(DEFAULT_QUERY_TIMEOUT), - factory), - builder.build()); + exprValueFactory), + requestBuilder.build()); } @Test void buildScrollRequestWithCorrectSize() { - Integer maxResultWindow = 500; Integer limit = 800; Integer offset = 10; - OpenSearchRequestBuilder builder = - new OpenSearchRequestBuilder("test", maxResultWindow, settings, factory); - builder.pushDownLimit(limit, offset); + requestBuilder.pushDownLimit(limit, offset); assertEquals( new OpenSearchScrollRequest( new OpenSearchRequest.IndexName("test"), new SearchSourceBuilder() .from(offset) - .size(maxResultWindow - offset) + .size(MAX_RESULT_WINDOW - offset) .timeout(DEFAULT_QUERY_TIMEOUT), - factory), - builder.build()); + exprValueFactory), + requestBuilder.build()); + } + + @Test + void testPushDownAggregation() { + AggregationBuilder aggBuilder = AggregationBuilders.composite( + "composite_buckets", + Collections.singletonList(new TermsValuesSourceBuilder("longA"))); + OpenSearchAggregationResponseParser responseParser = + new CompositeAggregationParser( + new SingleValueParser("AVG(intA)")); + requestBuilder.pushDownAggregation(Pair.of(List.of(aggBuilder), responseParser)); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(0) + .timeout(DEFAULT_QUERY_TIMEOUT) + .aggregation(aggBuilder), + requestBuilder.getSourceBuilder() + ); + verify(exprValueFactory).setParser(responseParser); + } + + @Test + void testPushDownSort() { + FieldSortBuilder sortBuilder = SortBuilders.fieldSort("intA"); + requestBuilder.pushDownSort(List.of(sortBuilder)); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(DEFAULT_LIMIT) + .timeout(DEFAULT_QUERY_TIMEOUT) + .sort(sortBuilder), + requestBuilder.getSourceBuilder()); + } + + @Test + void testPushDownProject() { + Set references = Set.of(DSL.ref("intA", INTEGER)); + requestBuilder.pushDownProjects(references); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(DEFAULT_LIMIT) + .timeout(DEFAULT_QUERY_TIMEOUT) + .fetchSource(new String[]{"intA"}, new String[0]), + requestBuilder.getSourceBuilder()); + } + + @Test + void testPushTypeMapping() { + Map typeMapping = Map.of("intA", INTEGER); + requestBuilder.pushTypeMapping(typeMapping); + + verify(exprValueFactory).setTypeMapping(typeMapping); } } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java index f432d64dcc..74c18f7c3d 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchIndexTest.java @@ -128,25 +128,28 @@ void getFieldTypes() { .put("blob", "binary") .build()))); - Map fieldTypes = index.getFieldTypes(); - assertThat( - fieldTypes, - allOf( - aMapWithSize(13), - hasEntry("name", ExprCoreType.STRING), - hasEntry("address", (ExprType) OpenSearchDataType.OPENSEARCH_TEXT), - hasEntry("age", ExprCoreType.INTEGER), - hasEntry("account_number", ExprCoreType.LONG), - hasEntry("balance1", ExprCoreType.FLOAT), - hasEntry("balance2", ExprCoreType.DOUBLE), - hasEntry("gender", ExprCoreType.BOOLEAN), - hasEntry("family", ExprCoreType.ARRAY), - hasEntry("employer", ExprCoreType.STRUCT), - hasEntry("birthday", ExprCoreType.TIMESTAMP), - hasEntry("id1", ExprCoreType.BYTE), - hasEntry("id2", ExprCoreType.SHORT), - hasEntry("blob", (ExprType) OpenSearchDataType.OPENSEARCH_BINARY) - )); + // Run more than once to confirm caching logic is covered and can work + for (int i = 0; i < 2; i++) { + Map fieldTypes = index.getFieldTypes(); + assertThat( + fieldTypes, + allOf( + aMapWithSize(13), + hasEntry("name", ExprCoreType.STRING), + hasEntry("address", (ExprType) OpenSearchDataType.OPENSEARCH_TEXT), + hasEntry("age", ExprCoreType.INTEGER), + hasEntry("account_number", ExprCoreType.LONG), + hasEntry("balance1", ExprCoreType.FLOAT), + hasEntry("balance2", ExprCoreType.DOUBLE), + hasEntry("gender", ExprCoreType.BOOLEAN), + hasEntry("family", ExprCoreType.ARRAY), + hasEntry("employer", ExprCoreType.STRUCT), + hasEntry("birthday", ExprCoreType.TIMESTAMP), + hasEntry("id1", ExprCoreType.BYTE), + hasEntry("id2", ExprCoreType.SHORT), + hasEntry("blob", (ExprType) OpenSearchDataType.OPENSEARCH_BINARY) + )); + } } @Test diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java index 152b1ef1de..50a83cdc5c 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -332,32 +332,6 @@ void test_limit_sort_filter_push_down() { ); } - /* - @Test - void aggregation_cant_merge_index_scan_with_limit() { - assertEquals( - project( - aggregation( - indexScan("schema", 10, 0, noProjects()), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), - optimize( - project( - aggregation( - indexScan("schema", 10, 0, noProjects()), - ImmutableList - .of(DSL.named("AVG(intV)", - DSL.avg(DSL.ref("intV", INTEGER)))), - ImmutableList.of(DSL.named("longV", - DSL.abs(DSL.ref("longV", LONG))))), - DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))))); - } - */ - /** * Project(intV, abs(intV)) -> Relation. * -- will be optimized as @@ -419,7 +393,7 @@ void only_one_project_should_be_push() { void sort_with_expression_cannot_merge_with_relation() { assertEqualsAfterOptimization( sort( - indexScanAggBuilder(), + indexScanBuilder(), Pair.of(SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) ), sort( @@ -429,6 +403,56 @@ void sort_with_expression_cannot_merge_with_relation() { ); } + @Test + void sort_with_expression_cannot_merge_with_aggregation() { + assertEqualsAfterOptimization( + sort( + indexScanAggBuilder( + withAggregationPushedDown( + aggregate("AVG(intV)") + .aggregateBy("intV") + .groupBy("stringV") + .resultTypes(Map.of( + "AVG(intV)", DOUBLE, + "stringV", STRING)))), + Pair.of(SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) + ), + sort( + aggregation( + relation("schema", table), + ImmutableList + .of(DSL.named("AVG(intV)", DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("stringV", DSL.ref("stringV", STRING)))), + Pair.of(SortOption.DEFAULT_ASC, DSL.abs(DSL.ref("intV", INTEGER))) + ) + ); + } + + @Test + void aggregation_cant_merge_index_scan_with_limit() { + assertEqualsAfterOptimization( + project( + aggregation( + indexScanBuilder( + withLimitPushedDown(10, 0)), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", + DSL.abs(DSL.ref("longV", LONG))))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE))), + project( + aggregation( + limit( + relation("schema", table), + 10, 0), + ImmutableList + .of(DSL.named("AVG(intV)", + DSL.avg(DSL.ref("intV", INTEGER)))), + ImmutableList.of(DSL.named("longV", + DSL.abs(DSL.ref("longV", LONG))))), + DSL.named("AVG(intV)", DSL.ref("AVG(intV)", DOUBLE)))); + } /** * Can't Optimize the following query. From d9cf5e878b24f5e15da9b262818f95db8d4ba998 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 13:34:48 -0800 Subject: [PATCH 03/16] Update javadoc with more details Signed-off-by: Chen Dai --- .../optimizer/LogicalPlanOptimizer.java | 4 +- .../rule/scan/CreateTableScanBuilder.java | 8 +++- .../rule/scan/TableScanPushDown.java | 5 ++- .../org/opensearch/sql/storage/Table.java | 6 +-- .../sql/storage/TableScanBuilder.java | 42 +++++++++++++++++-- .../opensearch/storage/OpenSearchIndex.java | 3 +- 6 files changed, 54 insertions(+), 14 deletions(-) diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java index d21abe182f..78c738b338 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java @@ -42,12 +42,12 @@ public LogicalPlanOptimizer(List> rules) { public static LogicalPlanOptimizer create() { return new LogicalPlanOptimizer(Arrays.asList( /* - * Phase 1: Transformations rely on static relation algebra equivalence + * Phase 1: Transformations that rely on relational algebra equivalence */ new MergeFilterAndFilter(), new PushFilterUnderSort(), /* - * Phase 2: Transformations rely on connector push down capability + * Phase 2: Transformations that rely on data source push down capability */ new CreateTableScanBuilder(), TableScanPushDown.PUSH_DOWN_FILTER, diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java index 845de5b890..ac6adf760a 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java @@ -19,12 +19,16 @@ import org.opensearch.sql.storage.TableScanBuilder; /** - * {@code RelationPushDown} defines a set of push down rules... + * Rule that replace logical relation operator to {@link TableScanBuilder} for later + * push down optimization. All push down optimization rules that depends on table scan + * builder needs to run after this. */ public class CreateTableScanBuilder implements Rule { + /** Capture the table inside matched logical relation operator. */ private final Capture
capture; + /** Pattern that matches logical relation operator. */ @Accessors(fluent = true) @Getter private final Pattern pattern; @@ -41,7 +45,7 @@ public CreateTableScanBuilder() { @Override public LogicalPlan apply(LogicalRelation plan, Captures captures) { TableScanBuilder scanBuilder = captures.get(capture).createScanBuilder(); - // TODO: temporary check to avoid impact and separate Prometheus refactor work + // TODO: Remove this after Prometheus refactored to new table scan builder too return (scanBuilder == null) ? plan : scanBuilder; } } diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java index e493fa5af6..5bd3f9f434 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java @@ -24,7 +24,10 @@ import org.opensearch.sql.storage.TableScanBuilder; /** - * Base class for all table scan push down rules. + * Rule template for all table scan push down rules. Because all push down optimization rules + * have similar workflow in common, such as a pattern that match an operator on top of table scan + * builder, and action that eliminates the original operator if pushed down, this class helps + * remove redundant code and improve readability. * * @param logical plan node type */ diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index 9c2812f8ba..0714811b10 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -46,7 +46,7 @@ default void create(Map schema) { * @return physical plan * @deprecated replaced by write/scan builder */ - @Deprecated(since = "2.5") + @Deprecated(since = "2.5.0") PhysicalPlan implement(LogicalPlan plan); /** @@ -57,7 +57,7 @@ default void create(Map schema) { * @return logical plan. * @deprecated replaced by write/scan builder */ - @Deprecated(since = "2.5") + @Deprecated(since = "2.5.0") default LogicalPlan optimize(LogicalPlan plan) { return plan; } @@ -67,7 +67,7 @@ default LogicalPlan optimize(LogicalPlan plan) { * @return table scan builder */ default TableScanBuilder createScanBuilder() { - return null; // TODO: enforce all connector to create one for unified optimizing workflow + return null; // TODO: Enforce all subclass to implement this later } } diff --git a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java index 24e812a1de..eee12f39c4 100644 --- a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java @@ -15,44 +15,78 @@ import org.opensearch.sql.planner.logical.LogicalSort; /** - * A {@code TableScanBuilder} represents transition state between logical planning - * and physical planning. + * A {@code TableScanBuilder} represents transition state between logical planning and + * physical planning. The concrete implementation class gets involved in the logical + * optimization through this abstraction and thus get the chance to handle push down + * optimization without intruding core engine. */ public abstract class TableScanBuilder extends LogicalPlan { + /** + * Construct and initialize children to empty list. + */ public TableScanBuilder() { super(Collections.emptyList()); } /** * Build table scan operator. + * * @return table scan operator */ public abstract TableScanOperator build(); /** - * Can a given filter be pushed down to table scan builder. Assume no such support + * Can a given filter operator be pushed down to table scan builder. Assume no such support * by default unless subclass override this. * - * @param filter filter node + * @param filter logical filter operator * @return true if pushed down, otherwise false */ public boolean pushDownFilter(LogicalFilter filter) { return false; } + /** + * Can a given aggregate operator be pushed down to table scan builder. Assume no such support + * by default unless subclass override this. + * + * @param aggregation logical aggregate operator + * @return true if pushed down, otherwise false + */ public boolean pushDownAggregation(LogicalAggregation aggregation) { return false; } + /** + * Can a given sort operator be pushed down to table scan builder. Assume no such support + * by default unless subclass override this. + * + * @param sort logical sort operator + * @return true if pushed down, otherwise false + */ public boolean pushDownSort(LogicalSort sort) { return false; } + /** + * Can a given limit operator be pushed down to table scan builder. Assume no such support + * by default unless subclass override this. + * + * @param limit logical limit operator + * @return true if pushed down, otherwise false + */ public boolean pushDownLimit(LogicalLimit limit) { return false; } + /** + * Can a given project operator be pushed down to table scan builder. Assume no such support + * by default unless subclass override this. + * + * @param project logical project operator + * @return true if pushed down, otherwise false + */ public boolean pushDownProject(LogicalProject project) { return false; } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java index ada6341def..6dfebed6f5 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java @@ -110,8 +110,7 @@ public Integer getMaxResultWindow() { */ @Override public PhysicalPlan implement(LogicalPlan plan) { - // TODO: deprecate this and move to Planner. For now leave it here to - // avoid impact Prometheus optimize/implement logic + // TODO: Leave it here to avoid impact Prometheus, AD and highlight. Need to move to Planner. return plan.accept(new OpenSearchDefaultImplementor(client), null); } From 180e0f16d7a24577f6dacdac6bf5ac7ecd168b24 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 14:35:39 -0800 Subject: [PATCH 04/16] Fix highlight pushdown issue Signed-off-by: Chen Dai --- .../optimizer/LogicalPlanOptimizer.java | 1 + .../planner/optimizer/pattern/Patterns.java | 8 ++++++ .../rule/scan/TableScanPushDown.java | 7 +++++ .../sql/storage/TableScanBuilder.java | 12 ++++++++ .../optimizer/LogicalPlanOptimizerTest.java | 17 +++++++++++ .../opensearch/storage/OpenSearchIndex.java | 9 ------ .../scan/OpenSearchIndexScanBuilder.java | 6 ++++ .../OpenSearchSimpleIndexScanBuilder.java | 10 +++++++ .../OpenSearchDefaultImplementorTest.java | 22 --------------- .../OpenSearchIndexScanOptimizationTest.java | 28 +++++++++++++++++++ 10 files changed, 89 insertions(+), 31 deletions(-) diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java index 78c738b338..536db28ae0 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java @@ -54,6 +54,7 @@ public static LogicalPlanOptimizer create() { TableScanPushDown.PUSH_DOWN_AGGREGATION, TableScanPushDown.PUSH_DOWN_SORT, TableScanPushDown.PUSH_DOWN_LIMIT, + TableScanPushDown.PUSH_DOWN_HIGHLIGHT, TableScanPushDown.PUSH_DOWN_PROJECT)); } diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java index b9768351c4..58ce8faf39 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java @@ -14,6 +14,7 @@ import lombok.experimental.UtilityClass; import org.opensearch.sql.planner.logical.LogicalAggregation; import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.logical.LogicalProject; @@ -56,6 +57,13 @@ public static Pattern limit(Pattern pat return Pattern.typeOf(LogicalLimit.class).with(source(pattern)); } + /** + * Logical highlight operator with a given pattern on inner field. + */ + public static Pattern highlight(Pattern pattern) { + return Pattern.typeOf(LogicalHighlight.class).with(source(pattern)); + } + /** * Logical project operator with a given pattern on inner field. */ diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java index 5bd3f9f434..6372ba52ec 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java @@ -7,6 +7,7 @@ import static org.opensearch.sql.planner.optimizer.pattern.Patterns.aggregate; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.filter; +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.highlight; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.limit; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.project; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.scanBuilder; @@ -67,6 +68,12 @@ public class TableScanPushDown implements Rule { scanBuilder())) .apply((project, scanBuilder) -> scanBuilder.pushDownProject(project)); + public static final Rule PUSH_DOWN_HIGHLIGHT = + match( + highlight( + scanBuilder())) + .apply((highlight, scanBuilder) -> scanBuilder.pushDownHighlight(highlight)); + /** Pattern that matches a plan node. */ private final WithPattern pattern; diff --git a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java index eee12f39c4..b053599815 100644 --- a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java @@ -8,6 +8,7 @@ import java.util.Collections; import org.opensearch.sql.planner.logical.LogicalAggregation; import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; @@ -91,6 +92,17 @@ public boolean pushDownProject(LogicalProject project) { return false; } + /** + * Can a given highlight operator be pushed down to table scan builder. Assume no such support + * by default unless subclass override this. + * + * @param highlight logical highlight operator + * @return true if pushed down, otherwise false + */ + public boolean pushDownHighlight(LogicalHighlight highlight) { + return false; + } + @Override public R accept(LogicalPlanNodeVisitor visitor, C context) { return visitor.visitScanBuilder(this, context); diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java index 4aba9efd10..7c2086f674 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java @@ -15,12 +15,14 @@ import static org.opensearch.sql.data.type.ExprCoreType.LONG; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.aggregation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.filter; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.highlight; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.limit; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; import com.google.common.collect.ImmutableList; +import java.util.Collections; import java.util.Map; import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; @@ -232,6 +234,21 @@ void table_scan_builder_support_limit_push_down_can_apply_its_rule() { ); } + @Test + void table_scan_builder_support_highlight_push_down_can_apply_its_rule() { + when(tableScanBuilder.pushDownHighlight(any())).thenReturn(true); + + assertEquals( + tableScanBuilder, + optimize( + highlight( + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER)), + Collections.emptyMap()) + ) + ); + } + @Test void table_not_support_scan_builder_should_not_be_impact() { Mockito.reset(table, tableScanBuilder); diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java index 6dfebed6f5..bf7bf47ca1 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java @@ -11,7 +11,6 @@ import java.util.Map; import lombok.RequiredArgsConstructor; import org.opensearch.sql.common.setting.Settings; -import org.opensearch.sql.common.utils.StringUtils; import org.opensearch.sql.data.type.ExprType; import org.opensearch.sql.opensearch.client.OpenSearchClient; import org.opensearch.sql.opensearch.data.type.OpenSearchDataType; @@ -24,7 +23,6 @@ import org.opensearch.sql.opensearch.storage.scan.OpenSearchIndexScanBuilder; import org.opensearch.sql.planner.DefaultImplementor; import org.opensearch.sql.planner.logical.LogicalAD; -import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalML; import org.opensearch.sql.planner.logical.LogicalMLCommons; import org.opensearch.sql.planner.logical.LogicalPlan; @@ -151,12 +149,5 @@ public PhysicalPlan visitML(LogicalML node, OpenSearchIndexScan context) { return new MLOperator(visitChild(node, context), node.getArguments(), client.getNodeClient()); } - - @Override - public PhysicalPlan visitHighlight(LogicalHighlight node, OpenSearchIndexScan context) { - context.getRequestBuilder().pushDownHighlight( - StringUtils.unquoteText(node.getHighlightField().toString()), node.getArguments()); - return visitChild(node, context); - } } } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java index b7eec84e09..35684b7e30 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -10,6 +10,7 @@ import org.opensearch.sql.opensearch.storage.OpenSearchIndexScan; import org.opensearch.sql.planner.logical.LogicalAggregation; import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalProject; import org.opensearch.sql.planner.logical.LogicalSort; @@ -84,4 +85,9 @@ public boolean pushDownLimit(LogicalLimit limit) { public boolean pushDownProject(LogicalProject project) { return delegate.pushDownProject(project); } + + @Override + public boolean pushDownHighlight(LogicalHighlight highlight) { + return delegate.pushDownHighlight(highlight); + } } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java index f8450112ed..4b3d2c7b26 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java @@ -15,6 +15,7 @@ import org.apache.commons.lang3.tuple.Pair; import org.opensearch.index.query.QueryBuilder; import org.opensearch.sql.ast.tree.Sort; +import org.opensearch.sql.common.utils.StringUtils; import org.opensearch.sql.expression.Expression; import org.opensearch.sql.expression.ExpressionNodeVisitor; import org.opensearch.sql.expression.NamedExpression; @@ -24,6 +25,7 @@ import org.opensearch.sql.opensearch.storage.script.sort.SortQueryBuilder; import org.opensearch.sql.opensearch.storage.serialization.DefaultExpressionSerializer; import org.opensearch.sql.planner.logical.LogicalFilter; +import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalProject; import org.opensearch.sql.planner.logical.LogicalSort; @@ -93,6 +95,14 @@ public boolean pushDownProject(LogicalProject project) { return false; } + @Override + public boolean pushDownHighlight(LogicalHighlight highlight) { + indexScan.getRequestBuilder().pushDownHighlight( + StringUtils.unquoteText(highlight.getHighlightField().toString()), + highlight.getArguments()); + return true; + } + private boolean sortByFieldsOnly(LogicalSort sort) { return sort.getSortList().stream() .map(sortItem -> sortItem.getRight() instanceof ReferenceExpression) diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java index dc8fb9d4cf..d7e5955491 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/OpenSearchDefaultImplementorTest.java @@ -6,12 +6,7 @@ package org.opensearch.sql.opensearch.storage; -import static org.junit.jupiter.api.Assertions.assertEquals; import static org.junit.jupiter.api.Assertions.assertNotNull; -import static org.junit.jupiter.api.Assertions.assertThrows; -import static org.mockito.ArgumentMatchers.any; -import static org.mockito.Mockito.verify; -import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import org.junit.jupiter.api.Test; import org.junit.jupiter.api.extension.ExtendWith; @@ -20,9 +15,7 @@ import org.mockito.Mockito; import org.mockito.junit.jupiter.MockitoExtension; import org.opensearch.sql.opensearch.client.OpenSearchClient; -import org.opensearch.sql.opensearch.request.OpenSearchRequestBuilder; import org.opensearch.sql.planner.logical.LogicalAD; -import org.opensearch.sql.planner.logical.LogicalHighlight; import org.opensearch.sql.planner.logical.LogicalML; import org.opensearch.sql.planner.logical.LogicalMLCommons; import org.opensearch.sql.planner.logical.LogicalPlan; @@ -66,19 +59,4 @@ public void visitML() { new OpenSearchIndex.OpenSearchDefaultImplementor(client); assertNotNull(implementor.visitML(node, null)); } - - @Test - public void visitHighlight() { - LogicalHighlight node = Mockito.mock(LogicalHighlight.class, - Answers.RETURNS_DEEP_STUBS); - Mockito.when(node.getChild().get(0)).thenReturn(Mockito.mock(LogicalPlan.class)); - OpenSearchIndexScan indexScan = Mockito.mock(OpenSearchIndexScan.class); - OpenSearchRequestBuilder requestBuilder = Mockito.mock(OpenSearchRequestBuilder.class); - Mockito.when(indexScan.getRequestBuilder()).thenReturn(requestBuilder); - OpenSearchIndex.OpenSearchDefaultImplementor implementor = - new OpenSearchIndex.OpenSearchDefaultImplementor(client); - - implementor.visitHighlight(node, indexScan); - verify(requestBuilder).pushDownHighlight(any(), any()); - } } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java index 50a83cdc5c..27bbcb820d 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -20,12 +20,14 @@ import static org.opensearch.sql.data.type.ExprCoreType.STRING; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.aggregation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.filter; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.highlight; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.limit; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_AGGREGATION; import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_FILTER; +import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_HIGHLIGHT; import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_LIMIT; import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_PROJECT; import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_SORT; @@ -52,9 +54,11 @@ import org.opensearch.search.sort.SortBuilder; import org.opensearch.search.sort.SortBuilders; import org.opensearch.search.sort.SortOrder; +import org.opensearch.sql.ast.expression.Literal; import org.opensearch.sql.ast.tree.Sort.SortOption; import org.opensearch.sql.data.type.ExprType; import org.opensearch.sql.expression.DSL; +import org.opensearch.sql.expression.HighlightExpression; import org.opensearch.sql.expression.ReferenceExpression; import org.opensearch.sql.opensearch.request.OpenSearchRequestBuilder; import org.opensearch.sql.opensearch.response.agg.CompositeAggregationParser; @@ -221,6 +225,25 @@ void test_limit_push_down() { ); } + @Test + void test_highlight_push_down() { + assertEqualsAfterOptimization( + project( + indexScanBuilder( + withHighlightPushedDown("*", Collections.emptyMap())), + DSL.named("highlight(*)", + new HighlightExpression(DSL.literal("*"))) + ), + project( + highlight( + relation("schema", table), + DSL.literal("*"), Collections.emptyMap()), + DSL.named("highlight(*)", + new HighlightExpression(DSL.literal("*"))) + ) + ); + } + /** * SELECT avg(intV) FROM schema WHERE intV = 1 GROUP BY string_value. */ @@ -573,6 +596,10 @@ private Runnable withProjectPushedDown(ReferenceExpression... references) { new HashSet<>(Arrays.asList(references))); } + private Runnable withHighlightPushedDown(String field, Map arguments) { + return () -> verify(requestBuilder, times(1)).pushDownHighlight(field, arguments); + } + private static AggregationAssertHelper.AggregationAssertHelperBuilder aggregate(String aggName) { var aggBuilder = new AggregationAssertHelper.AggregationAssertHelperBuilder(); aggBuilder.aggregateName = aggName; @@ -602,6 +629,7 @@ private LogicalPlan optimize(LogicalPlan plan) { PUSH_DOWN_AGGREGATION, PUSH_DOWN_SORT, PUSH_DOWN_LIMIT, + PUSH_DOWN_HIGHLIGHT, PUSH_DOWN_PROJECT)); return optimizer.optimize(plan); } From f455141beb9b073cd1005a01a7ab742c14db6cd8 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 15:53:35 -0800 Subject: [PATCH 05/16] Rename new class more properly Signed-off-by: Chen Dai --- .../sql/planner/optimizer/LogicalPlanOptimizer.java | 4 +++- core/src/main/java/org/opensearch/sql/storage/Table.java | 6 +++--- .../sql/planner/optimizer/LogicalPlanOptimizerTest.java | 2 +- .../opensearch/sql/opensearch/storage/OpenSearchIndex.java | 2 +- ...lder.java => OpenSearchIndexScanAggregationBuilder.java} | 4 ++-- .../opensearch/storage/scan/OpenSearchIndexScanBuilder.java | 4 ++-- ...canBuilder.java => OpenSearchIndexScanQueryBuilder.java} | 4 ++-- .../storage/scan/OpenSearchIndexScanOptimizationTest.java | 4 ++-- 8 files changed, 16 insertions(+), 14 deletions(-) rename opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/{OpenSearchAggregateIndexScanBuilder.java => OpenSearchIndexScanAggregationBuilder.java} (95%) rename opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/{OpenSearchSimpleIndexScanBuilder.java => OpenSearchIndexScanQueryBuilder.java} (97%) diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java index 536db28ae0..8ec41b2764 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java @@ -79,7 +79,9 @@ private LogicalPlan internalOptimize(LogicalPlan plan) { if (match.isPresent()) { node = rule.apply(match.value(), match.captures()); - // Re-iterate all rules against the node if the node is replaced by any rule + // For new TableScanPushDown impl, pattern match doesn't necessarily cause + // push down to happen. So reiterate all rules against the node only if the node + // is actually replaced by any rule. // TODO: may need to introduce fixed point or maximum iteration limit in future if (node != match.value()) { done = false; diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index 0714811b10..c138dfae94 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -44,7 +44,7 @@ default void create(Map schema) { * * @param plan logical plan * @return physical plan - * @deprecated replaced by write/scan builder + * @deprecated because of new {@link TableScanBuilder} implementation */ @Deprecated(since = "2.5.0") PhysicalPlan implement(LogicalPlan plan); @@ -55,7 +55,7 @@ default void create(Map schema) { * * @param plan logical plan. * @return logical plan. - * @deprecated replaced by write/scan builder + * @deprecated because of new {@link TableScanBuilder} implementation */ @Deprecated(since = "2.5.0") default LogicalPlan optimize(LogicalPlan plan) { @@ -67,7 +67,7 @@ default LogicalPlan optimize(LogicalPlan plan) { * @return table scan builder */ default TableScanBuilder createScanBuilder() { - return null; // TODO: Enforce all subclass to implement this later + return null; // TODO: Enforce all subclasses to implement this later } } diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java index 7c2086f674..9d13347d51 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java @@ -243,7 +243,7 @@ void table_scan_builder_support_highlight_push_down_can_apply_its_rule() { optimize( highlight( relation("schema", table), - DSL.named("i", DSL.ref("intV", INTEGER)), + DSL.literal("*"), Collections.emptyMap()) ) ); diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java index bf7bf47ca1..4fbe135f2a 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java @@ -108,7 +108,7 @@ public Integer getMaxResultWindow() { */ @Override public PhysicalPlan implement(LogicalPlan plan) { - // TODO: Leave it here to avoid impact Prometheus, AD and highlight. Need to move to Planner. + // TODO: Leave it here to avoid impact Prometheus and AD operators. Need to move to Planner. return plan.accept(new OpenSearchDefaultImplementor(client), null); } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java similarity index 95% rename from opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java rename to opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java index 95ece2939a..ef1949959e 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchAggregateIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java @@ -27,7 +27,7 @@ /** * Index scan builder for aggregate query used by {@link OpenSearchIndexScanBuilder} internally. */ -class OpenSearchAggregateIndexScanBuilder extends TableScanBuilder { +class OpenSearchIndexScanAggregationBuilder extends TableScanBuilder { /** OpenSearch index scan to be optimized. */ private final OpenSearchIndexScan indexScan; @@ -46,7 +46,7 @@ class OpenSearchAggregateIndexScanBuilder extends TableScanBuilder { * * @param indexScan index scan not fully optimized yet */ - OpenSearchAggregateIndexScanBuilder(OpenSearchIndexScan indexScan) { + OpenSearchIndexScanAggregationBuilder(OpenSearchIndexScan indexScan) { this.indexScan = indexScan; } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java index 35684b7e30..ce54270de5 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -43,7 +43,7 @@ public class OpenSearchIndexScanBuilder extends TableScanBuilder { * @param indexScan index scan to optimize */ public OpenSearchIndexScanBuilder(OpenSearchIndexScan indexScan) { - this.delegate = new OpenSearchSimpleIndexScanBuilder(indexScan); + this.delegate = new OpenSearchIndexScanQueryBuilder(indexScan); } @Override @@ -64,7 +64,7 @@ public boolean pushDownAggregation(LogicalAggregation aggregation) { // Switch to builder for aggregate query which has different push down logic // for later filter, sort and limit operator. - delegate = new OpenSearchAggregateIndexScanBuilder( + delegate = new OpenSearchIndexScanAggregationBuilder( (OpenSearchIndexScan) delegate.build()); return delegate.pushDownAggregation(aggregation); diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java similarity index 97% rename from opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java rename to opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java index 4b3d2c7b26..f03659ca43 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchSimpleIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java @@ -37,7 +37,7 @@ * {@link OpenSearchIndexScanBuilder} internally. */ @VisibleForTesting -class OpenSearchSimpleIndexScanBuilder extends TableScanBuilder { +class OpenSearchIndexScanQueryBuilder extends TableScanBuilder { /** OpenSearch index scan to be optimized. */ @EqualsAndHashCode.Include @@ -48,7 +48,7 @@ class OpenSearchSimpleIndexScanBuilder extends TableScanBuilder { * * @param indexScan index scan not optimized yet */ - OpenSearchSimpleIndexScanBuilder(OpenSearchIndexScan indexScan) { + OpenSearchIndexScanQueryBuilder(OpenSearchIndexScan indexScan) { this.indexScan = indexScan; } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java index 27bbcb820d..d7a4e84b17 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -529,12 +529,12 @@ void project_literal_no_push() { private OpenSearchIndexScanBuilder indexScanBuilder(Runnable... verifyPushDownCalls) { this.verifyPushDownCalls = verifyPushDownCalls; - return new OpenSearchIndexScanBuilder(new OpenSearchSimpleIndexScanBuilder(indexScan)); + return new OpenSearchIndexScanBuilder(new OpenSearchIndexScanQueryBuilder(indexScan)); } private OpenSearchIndexScanBuilder indexScanAggBuilder(Runnable... verifyPushDownCalls) { this.verifyPushDownCalls = verifyPushDownCalls; - return new OpenSearchIndexScanBuilder(new OpenSearchAggregateIndexScanBuilder(indexScan)); + return new OpenSearchIndexScanBuilder(new OpenSearchIndexScanAggregationBuilder(indexScan)); } private void assertEqualsAfterOptimization(LogicalPlan expected, LogicalPlan actual) { From bcfe6af66867b78842c4baae47e74201c7d74a9c Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 16:59:37 -0800 Subject: [PATCH 06/16] Fix default sort by doc issue Signed-off-by: Chen Dai --- .../request/OpenSearchRequestBuilder.java | 14 ++++++++++---- .../request/OpenSearchRequestBuilderTest.java | 10 +++++++--- .../scan/OpenSearchIndexScanOptimizationTest.java | 2 +- 3 files changed, 18 insertions(+), 8 deletions(-) diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java index c26413c622..1c61da8e7f 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java @@ -104,6 +104,9 @@ public OpenSearchRequestBuilder(OpenSearchRequest.IndexName indexName, * @return query request or scroll request */ public OpenSearchRequest build() { + // Sort by doc as long as no sort pushed down here, no matter if post-processing sort exists + sortByDocIfNoSortPushedDown(); + Integer from = sourceBuilder.from(); Integer size = sourceBuilder.size(); @@ -134,10 +137,6 @@ public void pushDown(QueryBuilder query) { .filter(query)); } } - - if (sourceBuilder.sorts() == null) { - sourceBuilder.sort(DOC_FIELD_NAME, ASC); // Make sure consistent order - } } /** @@ -220,4 +219,11 @@ public void pushTypeMapping(Map typeMapping) { private boolean isBoolFilterQuery(QueryBuilder current) { return (current instanceof BoolQueryBuilder); } + + private void sortByDocIfNoSortPushedDown() { + // Add sort to make sure consistent order + if (sourceBuilder.sorts() == null) { + sourceBuilder.sort(DOC_FIELD_NAME, ASC); + } + } } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java index 31bfd8ee26..868f9da935 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java @@ -9,6 +9,8 @@ import static org.junit.jupiter.api.Assertions.assertEquals; import static org.mockito.Mockito.verify; import static org.mockito.Mockito.when; +import static org.opensearch.search.sort.FieldSortBuilder.DOC_FIELD_NAME; +import static org.opensearch.search.sort.SortOrder.ASC; import static org.opensearch.sql.data.type.ExprCoreType.INTEGER; import java.util.Collections; @@ -73,7 +75,8 @@ void buildQueryRequest() { new SearchSourceBuilder() .from(offset) .size(limit) - .timeout(DEFAULT_QUERY_TIMEOUT), + .timeout(DEFAULT_QUERY_TIMEOUT) + .sort(DOC_FIELD_NAME, ASC), exprValueFactory), requestBuilder.build()); } @@ -90,8 +93,9 @@ void buildScrollRequestWithCorrectSize() { new SearchSourceBuilder() .from(offset) .size(MAX_RESULT_WINDOW - offset) - .timeout(DEFAULT_QUERY_TIMEOUT), - exprValueFactory), + .timeout(DEFAULT_QUERY_TIMEOUT) + .sort(DOC_FIELD_NAME, ASC), + exprValueFactory), requestBuilder.build()); } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java index d7a4e84b17..ab863ca234 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -512,7 +512,7 @@ void sort_refer_to_aggregator_should_not_merge_with_indexAgg() { } @Test - void project_literal_no_push() { + void project_literal_should_not_be_pushed_down() { assertEqualsAfterOptimization( project( indexScanBuilder(), From 5b2441ee693e657345eec7dd7a21353cf86d3db5 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 17:37:21 -0800 Subject: [PATCH 07/16] Rename visit method and javadoc Signed-off-by: Chen Dai --- .../java/org/opensearch/sql/planner/DefaultImplementor.java | 2 +- .../opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java | 2 +- core/src/main/java/org/opensearch/sql/storage/Table.java | 1 + .../main/java/org/opensearch/sql/storage/TableScanBuilder.java | 2 +- 4 files changed, 4 insertions(+), 3 deletions(-) diff --git a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java index db9b0e8fae..f37f2bf218 100644 --- a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java +++ b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java @@ -125,7 +125,7 @@ public PhysicalPlan visitLimit(LogicalLimit node, C context) { } @Override - public PhysicalPlan visitScanBuilder(TableScanBuilder plan, C context) { + public PhysicalPlan visitTableScanBuilder(TableScanBuilder plan, C context) { return plan.build(); } diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java index 9840e3942d..5efa2f938f 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java @@ -24,7 +24,7 @@ public R visitRelation(LogicalRelation plan, C context) { return visitNode(plan, context); } - public R visitScanBuilder(TableScanBuilder plan, C context) { + public R visitTableScanBuilder(TableScanBuilder plan, C context) { return visitNode(plan, context); } diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index c138dfae94..4fbf17b93d 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -64,6 +64,7 @@ default LogicalPlan optimize(LogicalPlan plan) { /** * Create table scan builder for logical to physical transformation. + * * @return table scan builder */ default TableScanBuilder createScanBuilder() { diff --git a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java index b053599815..90e0bfdef7 100644 --- a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java @@ -105,6 +105,6 @@ public boolean pushDownHighlight(LogicalHighlight highlight) { @Override public R accept(LogicalPlanNodeVisitor visitor, C context) { - return visitor.visitScanBuilder(this, context); + return visitor.visitTableScanBuilder(this, context); } } From 5dfad3853b601276757b5eb59d67774bc63f5545 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Tue, 22 Nov 2022 16:26:38 -0800 Subject: [PATCH 08/16] Move table scan builder and optimize rule to read package Signed-off-by: Chen Dai --- .../opensearch/sql/planner/DefaultImplementor.java | 2 +- .../planner/logical/LogicalPlanNodeVisitor.java | 2 +- .../planner/optimizer/LogicalPlanOptimizer.java | 4 ++-- .../sql/planner/optimizer/pattern/Patterns.java | 2 +- .../{scan => read}/CreateTableScanBuilder.java | 4 ++-- .../rule/{scan => read}/TableScanPushDown.java | 6 +++--- .../java/org/opensearch/sql/storage/Table.java | 1 + .../sql/storage/{ => read}/TableScanBuilder.java | 3 ++- .../sql/planner/DefaultImplementorTest.java | 2 +- .../logical/LogicalPlanNodeVisitorTest.java | 2 +- .../optimizer/LogicalPlanOptimizerTest.java | 2 +- .../sql/opensearch/storage/OpenSearchIndex.java | 2 +- .../OpenSearchIndexScanAggregationBuilder.java | 2 +- .../storage/scan/OpenSearchIndexScanBuilder.java | 2 +- .../scan/OpenSearchIndexScanQueryBuilder.java | 2 +- .../scan/OpenSearchIndexScanOptimizationTest.java | 14 +++++++------- 16 files changed, 27 insertions(+), 25 deletions(-) rename core/src/main/java/org/opensearch/sql/planner/optimizer/rule/{scan => read}/CreateTableScanBuilder.java (93%) rename core/src/main/java/org/opensearch/sql/planner/optimizer/rule/{scan => read}/TableScanPushDown.java (96%) rename core/src/main/java/org/opensearch/sql/storage/{ => read}/TableScanBuilder.java (97%) diff --git a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java index f37f2bf218..4a5276418d 100644 --- a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java +++ b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java @@ -34,7 +34,7 @@ import org.opensearch.sql.planner.physical.SortOperator; import org.opensearch.sql.planner.physical.ValuesOperator; import org.opensearch.sql.planner.physical.WindowOperator; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Default implementor for implementing logical to physical translation. "Default" here means all diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java index 5efa2f938f..0386eb6e2a 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java @@ -6,7 +6,7 @@ package org.opensearch.sql.planner.logical; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * The visitor of {@link LogicalPlan}. diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java index 8ec41b2764..f241e76993 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java @@ -15,8 +15,8 @@ import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.optimizer.rule.MergeFilterAndFilter; import org.opensearch.sql.planner.optimizer.rule.PushFilterUnderSort; -import org.opensearch.sql.planner.optimizer.rule.scan.CreateTableScanBuilder; -import org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown; +import org.opensearch.sql.planner.optimizer.rule.read.CreateTableScanBuilder; +import org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown; /** * {@link LogicalPlan} Optimizer. diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java index 58ce8faf39..0ba478594a 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java @@ -21,7 +21,7 @@ import org.opensearch.sql.planner.logical.LogicalRelation; import org.opensearch.sql.planner.logical.LogicalSort; import org.opensearch.sql.storage.Table; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Pattern helper class. diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/read/CreateTableScanBuilder.java similarity index 93% rename from core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java rename to core/src/main/java/org/opensearch/sql/planner/optimizer/rule/read/CreateTableScanBuilder.java index ac6adf760a..dbe61ca8c3 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/CreateTableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/read/CreateTableScanBuilder.java @@ -3,7 +3,7 @@ * SPDX-License-Identifier: Apache-2.0 */ -package org.opensearch.sql.planner.optimizer.rule.scan; +package org.opensearch.sql.planner.optimizer.rule.read; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.table; @@ -16,7 +16,7 @@ import org.opensearch.sql.planner.logical.LogicalRelation; import org.opensearch.sql.planner.optimizer.Rule; import org.opensearch.sql.storage.Table; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Rule that replace logical relation operator to {@link TableScanBuilder} for later diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/read/TableScanPushDown.java similarity index 96% rename from core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java rename to core/src/main/java/org/opensearch/sql/planner/optimizer/rule/read/TableScanPushDown.java index 6372ba52ec..556a12bb34 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/scan/TableScanPushDown.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/read/TableScanPushDown.java @@ -3,7 +3,7 @@ * SPDX-License-Identifier: Apache-2.0 */ -package org.opensearch.sql.planner.optimizer.rule.scan; +package org.opensearch.sql.planner.optimizer.rule.read; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.aggregate; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.filter; @@ -12,7 +12,7 @@ import static org.opensearch.sql.planner.optimizer.pattern.Patterns.project; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.scanBuilder; import static org.opensearch.sql.planner.optimizer.pattern.Patterns.sort; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.TableScanPushDownBuilder.match; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.TableScanPushDownBuilder.match; import com.facebook.presto.matching.Capture; import com.facebook.presto.matching.Captures; @@ -22,7 +22,7 @@ import java.util.function.BiFunction; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.optimizer.Rule; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Rule template for all table scan push down rules. Because all push down optimization rules diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index 4fbf17b93d..b23b8596c1 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -10,6 +10,7 @@ import org.opensearch.sql.data.type.ExprType; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.physical.PhysicalPlan; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Table. diff --git a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java b/core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java similarity index 97% rename from core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java rename to core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java index 90e0bfdef7..a7fe8ca297 100644 --- a/core/src/main/java/org/opensearch/sql/storage/TableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java @@ -3,7 +3,7 @@ * SPDX-License-Identifier: Apache-2.0 */ -package org.opensearch.sql.storage; +package org.opensearch.sql.storage.read; import java.util.Collections; import org.opensearch.sql.planner.logical.LogicalAggregation; @@ -14,6 +14,7 @@ import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; import org.opensearch.sql.planner.logical.LogicalProject; import org.opensearch.sql.planner.logical.LogicalSort; +import org.opensearch.sql.storage.TableScanOperator; /** * A {@code TableScanBuilder} represents transition state between logical planning and diff --git a/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java b/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java index bcd39d28c3..2322e4684e 100644 --- a/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java @@ -56,8 +56,8 @@ import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.planner.physical.PhysicalPlanDSL; import org.opensearch.sql.storage.Table; -import org.opensearch.sql.storage.TableScanBuilder; import org.opensearch.sql.storage.TableScanOperator; +import org.opensearch.sql.storage.read.TableScanBuilder; @ExtendWith(MockitoExtension.class) class DefaultImplementorTest { diff --git a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java index 654586c844..33c6b02c38 100644 --- a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java @@ -32,8 +32,8 @@ import org.opensearch.sql.expression.aggregation.Aggregator; import org.opensearch.sql.expression.window.WindowDefinition; import org.opensearch.sql.storage.Table; -import org.opensearch.sql.storage.TableScanBuilder; import org.opensearch.sql.storage.TableScanOperator; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Todo. Temporary added for UT coverage, Will be removed. diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java index 9d13347d51..e2510ec464 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java @@ -38,7 +38,7 @@ import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.Table; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; @ExtendWith(MockitoExtension.class) class LogicalPlanOptimizerTest { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java index 4fbe135f2a..c694769b89 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java @@ -28,7 +28,7 @@ import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.Table; -import org.opensearch.sql.storage.TableScanBuilder; +import org.opensearch.sql.storage.read.TableScanBuilder; /** OpenSearch table (index) implementation. */ public class OpenSearchIndex implements Table { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java index ef1949959e..b62acfbc6f 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java @@ -21,8 +21,8 @@ import org.opensearch.sql.opensearch.storage.serialization.DefaultExpressionSerializer; import org.opensearch.sql.planner.logical.LogicalAggregation; import org.opensearch.sql.planner.logical.LogicalSort; -import org.opensearch.sql.storage.TableScanBuilder; import org.opensearch.sql.storage.TableScanOperator; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Index scan builder for aggregate query used by {@link OpenSearchIndexScanBuilder} internally. diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java index ce54270de5..16ebd1abfe 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -14,8 +14,8 @@ import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalProject; import org.opensearch.sql.planner.logical.LogicalSort; -import org.opensearch.sql.storage.TableScanBuilder; import org.opensearch.sql.storage.TableScanOperator; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Table scan builder that builds table scan operator for OpenSearch. The actual work is performed diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java index f03659ca43..29858be197 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java @@ -29,8 +29,8 @@ import org.opensearch.sql.planner.logical.LogicalLimit; import org.opensearch.sql.planner.logical.LogicalProject; import org.opensearch.sql.planner.logical.LogicalSort; -import org.opensearch.sql.storage.TableScanBuilder; import org.opensearch.sql.storage.TableScanOperator; +import org.opensearch.sql.storage.read.TableScanBuilder; /** * Index scan builder for simple non-aggregate query used by diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java index ab863ca234..6aa6f4446c 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -25,12 +25,12 @@ import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_AGGREGATION; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_FILTER; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_HIGHLIGHT; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_LIMIT; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_PROJECT; -import static org.opensearch.sql.planner.optimizer.rule.scan.TableScanPushDown.PUSH_DOWN_SORT; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.PUSH_DOWN_AGGREGATION; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.PUSH_DOWN_FILTER; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.PUSH_DOWN_HIGHLIGHT; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.PUSH_DOWN_LIMIT; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.PUSH_DOWN_PROJECT; +import static org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown.PUSH_DOWN_SORT; import com.google.common.collect.ImmutableList; import java.util.Arrays; @@ -68,7 +68,7 @@ import org.opensearch.sql.opensearch.storage.script.aggregation.AggregationQueryBuilder; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.optimizer.LogicalPlanOptimizer; -import org.opensearch.sql.planner.optimizer.rule.scan.CreateTableScanBuilder; +import org.opensearch.sql.planner.optimizer.rule.read.CreateTableScanBuilder; import org.opensearch.sql.storage.Table; From 55310c9cb43973f6efda3e420d988e79b13791d1 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Tue, 22 Nov 2022 18:14:45 -0800 Subject: [PATCH 09/16] Fix sort push down issue Signed-off-by: Chen Dai --- .../request/OpenSearchRequestBuilder.java | 25 +++++-- .../request/OpenSearchRequestBuilderTest.java | 73 ++++++++++++++++++- 2 files changed, 87 insertions(+), 11 deletions(-) diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java index 1c61da8e7f..439a970a4f 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilder.java @@ -9,6 +9,8 @@ import static org.opensearch.search.sort.FieldSortBuilder.DOC_FIELD_NAME; import static org.opensearch.search.sort.SortOrder.ASC; +import com.google.common.collect.Lists; +import java.util.Arrays; import java.util.List; import java.util.Map; import java.util.Set; @@ -24,7 +26,9 @@ import org.opensearch.search.aggregations.AggregationBuilder; import org.opensearch.search.builder.SearchSourceBuilder; import org.opensearch.search.fetch.subphase.highlight.HighlightBuilder; +import org.opensearch.search.sort.FieldSortBuilder; import org.opensearch.search.sort.SortBuilder; +import org.opensearch.search.sort.SortBuilders; import org.opensearch.sql.ast.expression.Literal; import org.opensearch.sql.common.setting.Settings; import org.opensearch.sql.common.utils.StringUtils; @@ -104,9 +108,6 @@ public OpenSearchRequestBuilder(OpenSearchRequest.IndexName indexName, * @return query request or scroll request */ public OpenSearchRequest build() { - // Sort by doc as long as no sort pushed down here, no matter if post-processing sort exists - sortByDocIfNoSortPushedDown(); - Integer from = sourceBuilder.from(); Integer size = sourceBuilder.size(); @@ -137,6 +138,10 @@ public void pushDown(QueryBuilder query) { .filter(query)); } } + + if (sourceBuilder.sorts() == null) { + sourceBuilder.sort(DOC_FIELD_NAME, ASC); // Make sure consistent order + } } /** @@ -157,6 +162,11 @@ public void pushDownAggregation( * @param sortBuilders sortBuilders. */ public void pushDownSort(List> sortBuilders) { + // TODO: Sort by _doc is added when filter push down. Remove both logic once doctest fixed. + if (isSortByDocOnly()) { + sourceBuilder.sorts().clear(); + } + for (SortBuilder sortBuilder : sortBuilders) { sourceBuilder.sort(sortBuilder); } @@ -220,10 +230,11 @@ private boolean isBoolFilterQuery(QueryBuilder current) { return (current instanceof BoolQueryBuilder); } - private void sortByDocIfNoSortPushedDown() { - // Add sort to make sure consistent order - if (sourceBuilder.sorts() == null) { - sourceBuilder.sort(DOC_FIELD_NAME, ASC); + private boolean isSortByDocOnly() { + List> sorts = sourceBuilder.sorts(); + if (sorts != null) { + return sorts.equals(Arrays.asList(SortBuilders.fieldSort(DOC_FIELD_NAME))); } + return false; } } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java index 868f9da935..33376ece83 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/request/OpenSearchRequestBuilderTest.java @@ -24,11 +24,14 @@ import org.mockito.Mock; import org.mockito.junit.jupiter.MockitoExtension; import org.opensearch.common.unit.TimeValue; +import org.opensearch.index.query.QueryBuilder; +import org.opensearch.index.query.QueryBuilders; import org.opensearch.search.aggregations.AggregationBuilder; import org.opensearch.search.aggregations.AggregationBuilders; import org.opensearch.search.aggregations.bucket.composite.TermsValuesSourceBuilder; import org.opensearch.search.builder.SearchSourceBuilder; import org.opensearch.search.sort.FieldSortBuilder; +import org.opensearch.search.sort.ScoreSortBuilder; import org.opensearch.search.sort.SortBuilders; import org.opensearch.sql.common.setting.Settings; import org.opensearch.sql.data.type.ExprType; @@ -75,8 +78,7 @@ void buildQueryRequest() { new SearchSourceBuilder() .from(offset) .size(limit) - .timeout(DEFAULT_QUERY_TIMEOUT) - .sort(DOC_FIELD_NAME, ASC), + .timeout(DEFAULT_QUERY_TIMEOUT), exprValueFactory), requestBuilder.build()); } @@ -93,12 +95,27 @@ void buildScrollRequestWithCorrectSize() { new SearchSourceBuilder() .from(offset) .size(MAX_RESULT_WINDOW - offset) - .timeout(DEFAULT_QUERY_TIMEOUT) - .sort(DOC_FIELD_NAME, ASC), + .timeout(DEFAULT_QUERY_TIMEOUT), exprValueFactory), requestBuilder.build()); } + @Test + void testPushDownQuery() { + QueryBuilder query = QueryBuilders.termQuery("intA", 1); + requestBuilder.pushDown(query); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(DEFAULT_LIMIT) + .timeout(DEFAULT_QUERY_TIMEOUT) + .query(query) + .sort(DOC_FIELD_NAME, ASC), + requestBuilder.getSourceBuilder() + ); + } + @Test void testPushDownAggregation() { AggregationBuilder aggBuilder = AggregationBuilders.composite( @@ -120,6 +137,24 @@ void testPushDownAggregation() { verify(exprValueFactory).setParser(responseParser); } + @Test + void testPushDownQueryAndSort() { + QueryBuilder query = QueryBuilders.termQuery("intA", 1); + requestBuilder.pushDown(query); + + FieldSortBuilder sortBuilder = SortBuilders.fieldSort("intA"); + requestBuilder.pushDownSort(List.of(sortBuilder)); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(DEFAULT_LIMIT) + .timeout(DEFAULT_QUERY_TIMEOUT) + .query(query) + .sort(sortBuilder), + requestBuilder.getSourceBuilder()); + } + @Test void testPushDownSort() { FieldSortBuilder sortBuilder = SortBuilders.fieldSort("intA"); @@ -134,6 +169,36 @@ void testPushDownSort() { requestBuilder.getSourceBuilder()); } + @Test + void testPushDownNonFieldSort() { + ScoreSortBuilder sortBuilder = SortBuilders.scoreSort(); + requestBuilder.pushDownSort(List.of(sortBuilder)); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(DEFAULT_LIMIT) + .timeout(DEFAULT_QUERY_TIMEOUT) + .sort(sortBuilder), + requestBuilder.getSourceBuilder()); + } + + @Test + void testPushDownMultipleSort() { + requestBuilder.pushDownSort(List.of( + SortBuilders.fieldSort("intA"), + SortBuilders.fieldSort("intB"))); + + assertEquals( + new SearchSourceBuilder() + .from(DEFAULT_OFFSET) + .size(DEFAULT_LIMIT) + .timeout(DEFAULT_QUERY_TIMEOUT) + .sort(SortBuilders.fieldSort("intA")) + .sort(SortBuilders.fieldSort("intB")), + requestBuilder.getSourceBuilder()); + } + @Test void testPushDownProject() { Set references = Set.of(DSL.ref("intA", INTEGER)); From 837fcb87ad8b4f0c9451ef2ba4c328327c959d9c Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Wed, 23 Nov 2022 11:00:16 -0800 Subject: [PATCH 10/16] Move sortByFields to parent scan builder Signed-off-by: Chen Dai --- .../opensearch/sql/storage/read/TableScanBuilder.java | 8 ++++---- .../scan/OpenSearchIndexScanAggregationBuilder.java | 8 +------- .../storage/scan/OpenSearchIndexScanBuilder.java | 10 ++++++++++ .../storage/scan/OpenSearchIndexScanQueryBuilder.java | 10 ---------- 4 files changed, 15 insertions(+), 21 deletions(-) diff --git a/core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java b/core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java index a7fe8ca297..c0fdf36e70 100644 --- a/core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java +++ b/core/src/main/java/org/opensearch/sql/storage/read/TableScanBuilder.java @@ -17,10 +17,10 @@ import org.opensearch.sql.storage.TableScanOperator; /** - * A {@code TableScanBuilder} represents transition state between logical planning and - * physical planning. The concrete implementation class gets involved in the logical - * optimization through this abstraction and thus get the chance to handle push down - * optimization without intruding core engine. + * A TableScanBuilder represents transition state between logical planning and physical planning + * for table scan operator. The concrete implementation class gets involved in the logical + * optimization through this abstraction and thus get the chance to handle push down optimization + * without intruding core engine. */ public abstract class TableScanBuilder extends LogicalPlan { diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java index b62acfbc6f..e52fc566cd 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanAggregationBuilder.java @@ -71,7 +71,7 @@ public boolean pushDownAggregation(LogicalAggregation aggregation) { @Override public boolean pushDownSort(LogicalSort sort) { - if (!sortByFieldsOnly(sort) || hasAggregatorInSortBy(sort)) { + if (hasAggregatorInSortBy(sort)) { return false; } @@ -79,12 +79,6 @@ public boolean pushDownSort(LogicalSort sort) { return true; } - private boolean sortByFieldsOnly(LogicalSort sort) { - return sort.getSortList().stream() - .map(sortItem -> sortItem.getRight() instanceof ReferenceExpression) - .reduce(true, Boolean::logicalAnd); - } - private boolean hasAggregatorInSortBy(LogicalSort sort) { final Set aggregatorNames = aggregatorList.stream().map(NamedAggregator::getName).collect(Collectors.toSet()); diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java index 16ebd1abfe..38acdbff4a 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -7,6 +7,7 @@ import com.google.common.annotations.VisibleForTesting; import lombok.EqualsAndHashCode; +import org.opensearch.sql.expression.ReferenceExpression; import org.opensearch.sql.opensearch.storage.OpenSearchIndexScan; import org.opensearch.sql.planner.logical.LogicalAggregation; import org.opensearch.sql.planner.logical.LogicalFilter; @@ -72,6 +73,9 @@ public boolean pushDownAggregation(LogicalAggregation aggregation) { @Override public boolean pushDownSort(LogicalSort sort) { + if (!sortByFieldsOnly(sort)) { + return false; + } return delegate.pushDownSort(sort); } @@ -90,4 +94,10 @@ public boolean pushDownProject(LogicalProject project) { public boolean pushDownHighlight(LogicalHighlight highlight) { return delegate.pushDownHighlight(highlight); } + + private boolean sortByFieldsOnly(LogicalSort sort) { + return sort.getSortList().stream() + .map(sortItem -> sortItem.getRight() instanceof ReferenceExpression) + .reduce(true, Boolean::logicalAnd); + } } diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java index 29858be197..7190d58000 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanQueryBuilder.java @@ -68,10 +68,6 @@ public boolean pushDownFilter(LogicalFilter filter) { @Override public boolean pushDownSort(LogicalSort sort) { - if (!sortByFieldsOnly(sort)) { - return false; - } - List> sortList = sort.getSortList(); final SortQueryBuilder builder = new SortQueryBuilder(); indexScan.getRequestBuilder().pushDownSort(sortList.stream() @@ -103,12 +99,6 @@ public boolean pushDownHighlight(LogicalHighlight highlight) { return true; } - private boolean sortByFieldsOnly(LogicalSort sort) { - return sort.getSortList().stream() - .map(sortItem -> sortItem.getRight() instanceof ReferenceExpression) - .reduce(true, Boolean::logicalAnd); - } - /** * Find reference expression from expression. * @param expressions a list of expression. From 9d1109c54c2257dd94c08fdf3225693db5da1730 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Wed, 23 Nov 2022 13:59:17 -0800 Subject: [PATCH 11/16] Add back old test Signed-off-by: Chen Dai --- .../scan/OpenSearchIndexScanBuilder.java | 8 +-- .../OpenSearchIndexScanOptimizationTest.java | 49 +++++-------------- 2 files changed, 16 insertions(+), 41 deletions(-) diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java index 38acdbff4a..d7483cfcf0 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanBuilder.java @@ -31,7 +31,8 @@ public class OpenSearchIndexScanBuilder extends TableScanBuilder { @EqualsAndHashCode.Include private TableScanBuilder delegate; - private boolean hasLimit = false; + /** Is limit operator pushed down. */ + private boolean isLimitPushedDown = false; @VisibleForTesting OpenSearchIndexScanBuilder(TableScanBuilder delegate) { @@ -59,7 +60,7 @@ public boolean pushDownFilter(LogicalFilter filter) { @Override public boolean pushDownAggregation(LogicalAggregation aggregation) { - if (hasLimit) { + if (isLimitPushedDown) { return false; } @@ -81,7 +82,8 @@ public boolean pushDownSort(LogicalSort sort) { @Override public boolean pushDownLimit(LogicalLimit limit) { - hasLimit = true; + // Assume limit push down happening on OpenSearchIndexScanQueryBuilder + isLimitPushedDown = true; return delegate.pushDownLimit(limit); } diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java index 6aa6f4446c..363727cbd3 100644 --- a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/scan/OpenSearchIndexScanOptimizationTest.java @@ -355,62 +355,35 @@ void test_limit_sort_filter_push_down() { ); } - /** - * Project(intV, abs(intV)) -> Relation. - * -- will be optimized as - * Project(intV, abs(intV)) -> Relation(project=intV). - */ - /* - @Test - void push_down_should_handle_duplication() { - assertEquals( - project( - indexScan("schema", projects(DSL.ref("intV", INTEGER))), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("absi", DSL.abs(DSL.ref("intV", INTEGER))) - ), - optimize( - project( - relation("schema", table), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("absi", DSL.abs(DSL.ref("intV", INTEGER)))) - ) - ); - } - */ - /* * Project(ListA) -> Project(ListB) -> Relation. * -- will be optimized as * Project(ListA) -> Project(ListB) -> Relation(project=ListB). */ - /* @Test void only_one_project_should_be_push() { - assertEquals( + assertEqualsAfterOptimization( project( project( - indexScan("schema", - projects(DSL.ref("intV", INTEGER), DSL.ref("stringV", STRING)) - ), + indexScanBuilder( + withProjectPushedDown( + DSL.ref("intV", INTEGER), + DSL.ref("stringV", STRING))), DSL.named("i", DSL.ref("intV", INTEGER)), DSL.named("s", DSL.ref("stringV", STRING)) ), DSL.named("i", DSL.ref("intV", INTEGER)) ), - optimize( + project( project( - project( - relation("schema", table), - DSL.named("i", DSL.ref("intV", INTEGER)), - DSL.named("s", DSL.ref("stringV", STRING)) - ), - DSL.named("i", DSL.ref("intV", INTEGER)) - ) + relation("schema", table), + DSL.named("i", DSL.ref("intV", INTEGER)), + DSL.named("s", DSL.ref("stringV", STRING)) + ), + DSL.named("i", DSL.ref("intV", INTEGER)) ) ); } - */ @Test void sort_with_expression_cannot_merge_with_relation() { From 15d131de9b34532cb365652639616e212d35b94d Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 21 Nov 2022 17:33:25 -0800 Subject: [PATCH 12/16] Add table write operator and builder Signed-off-by: Chen Dai --- .../logical/LogicalPlanNodeVisitor.java | 5 +++ .../physical/PhysicalPlanNodeVisitor.java | 5 +++ .../org/opensearch/sql/storage/Table.java | 10 +++++ .../sql/storage/TableWriteBuilder.java | 38 +++++++++++++++++ .../sql/storage/TableWriteOperator.java | 41 +++++++++++++++++++ 5 files changed, 99 insertions(+) create mode 100644 core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java create mode 100644 core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java index 0386eb6e2a..f7330b5c3d 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java @@ -7,6 +7,7 @@ package org.opensearch.sql.planner.logical; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.TableWriteBuilder; /** * The visitor of {@link LogicalPlan}. @@ -28,6 +29,10 @@ public R visitTableScanBuilder(TableScanBuilder plan, C context) { return visitNode(plan, context); } + public R visitTableWriteBuilder(TableWriteBuilder plan, C context) { + return visitNode(plan, context); + } + public R visitFilter(LogicalFilter plan, C context) { return visitNode(plan, context); } diff --git a/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java index 63dd05cc6b..a5a578b1d4 100644 --- a/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java @@ -7,6 +7,7 @@ package org.opensearch.sql.planner.physical; import org.opensearch.sql.storage.TableScanOperator; +import org.opensearch.sql.storage.TableWriteOperator; /** * The visitor of {@link PhysicalPlan}. @@ -36,6 +37,10 @@ public R visitTableScan(TableScanOperator node, C context) { return visitNode(node, context); } + public R visitTableWrite(TableWriteOperator node, C context) { + return visitNode(node, context); + } + public R visitProject(ProjectOperator node, C context) { return visitNode(node, context); } diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index ae0aaaf17b..8196071a68 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -73,6 +73,16 @@ default TableScanBuilder createScanBuilder() { return null; // TODO: Enforce all subclasses to implement this later } + /* + * Create table write builder for logical to physical transformation. + * + * @return table write builder + */ + default TableWriteBuilder createWriteBuilder() { + throw new UnsupportedOperationException( + "Write operation is not supported on current table"); + } + /** * Translate {@link Table} to {@link StreamingSource} if possible. */ diff --git a/core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java b/core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java new file mode 100644 index 0000000000..c174b00377 --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java @@ -0,0 +1,38 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.storage; + +import java.util.Collections; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; + +/** + * A {@link TableWriteBuilder} represents transition state between logical planning and physical + * planning for table write operator. The concrete implementation class gets involved in the logical + * optimization through this abstraction and thus transform to specific {@link TableWriteOperator} in + * a certain data source. + */ +public abstract class TableWriteBuilder extends LogicalPlan { + + /** + * Construct table write builder with child node. + */ + public TableWriteBuilder(LogicalPlan child) { + super(Collections.singletonList(child)); + } + + /** + * Build table write operator. + * + * @return table write operator + */ + public abstract TableWriteOperator build(); + + @Override + public R accept(LogicalPlanNodeVisitor visitor, C context) { + return visitor.visitTableWriteBuilder(this, context); + } +} diff --git a/core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java b/core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java new file mode 100644 index 0000000000..5f922c51b4 --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java @@ -0,0 +1,41 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.storage; + +import java.util.Collections; +import java.util.List; +import lombok.RequiredArgsConstructor; +import org.opensearch.sql.planner.physical.PhysicalPlan; +import org.opensearch.sql.planner.physical.PhysicalPlanNodeVisitor; + +/** + * {@link TableWriteOperator} is the abstraction for data source to implement different physical + * write operator on a data source. This is also to avoid "polluting" physical plan visitor by + * concrete table scan implementation. + */ +@RequiredArgsConstructor +public abstract class TableWriteOperator extends PhysicalPlan { + + /** Child physical node. */ + private final PhysicalPlan child; + + @Override + public R accept(PhysicalPlanNodeVisitor visitor, C context) { + return visitor.visitTableWrite(this, context); + } + + @Override + public List getChild() { + return Collections.singletonList(child); + } + + /** + * Explain the execution plan. + * + * @return explain output + */ + public abstract String explain(); +} From 065c1599fb3ecdc336cb5b45bb3f73fb1e66998d Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Tue, 22 Nov 2022 15:11:11 -0800 Subject: [PATCH 13/16] Add UT for all new classes Signed-off-by: Chen Dai --- .../sql/planner/DefaultImplementor.java | 6 ++ .../sql/planner/logical/LogicalPlanDSL.java | 4 ++ .../logical/LogicalPlanNodeVisitor.java | 6 +- .../sql/planner/logical/LogicalWrite.java | 34 +++++++++ .../optimizer/LogicalPlanOptimizer.java | 4 +- .../planner/optimizer/pattern/Patterns.java | 11 +++ .../rule/write/CreateTableWriteBuilder.java | 48 +++++++++++++ .../physical/PhysicalPlanNodeVisitor.java | 2 +- .../org/opensearch/sql/storage/Table.java | 5 +- .../{ => write}/TableWriteBuilder.java | 12 ++-- .../{ => write}/TableWriteOperator.java | 2 +- .../sql/planner/DefaultImplementorTest.java | 15 ++++ .../logical/LogicalPlanNodeVisitorTest.java | 16 +++++ .../optimizer/LogicalPlanOptimizerTest.java | 35 ++++++++++ .../optimizer/pattern/PatternsTest.java | 1 + .../storage/write/TableWriteOperatorTest.java | 70 +++++++++++++++++++ 16 files changed, 261 insertions(+), 10 deletions(-) create mode 100644 core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java create mode 100644 core/src/main/java/org/opensearch/sql/planner/optimizer/rule/write/CreateTableWriteBuilder.java rename core/src/main/java/org/opensearch/sql/storage/{ => write}/TableWriteBuilder.java (74%) rename core/src/main/java/org/opensearch/sql/storage/{ => write}/TableWriteOperator.java (96%) create mode 100644 core/src/test/java/org/opensearch/sql/storage/write/TableWriteOperatorTest.java diff --git a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java index 4a5276418d..4a6d4d8222 100644 --- a/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java +++ b/core/src/main/java/org/opensearch/sql/planner/DefaultImplementor.java @@ -35,6 +35,7 @@ import org.opensearch.sql.planner.physical.ValuesOperator; import org.opensearch.sql.planner.physical.WindowOperator; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; /** * Default implementor for implementing logical to physical translation. "Default" here means all @@ -129,6 +130,11 @@ public PhysicalPlan visitTableScanBuilder(TableScanBuilder plan, C context) { return plan.build(); } + @Override + public PhysicalPlan visitTableWriteBuilder(TableWriteBuilder plan, C context) { + return plan.build(visitChild(plan, context)); + } + @Override public PhysicalPlan visitRelation(LogicalRelation node, C context) { throw new UnsupportedOperationException("Storage engine is responsible for " diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java index b18e099afa..842f46fb0b 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java @@ -32,6 +32,10 @@ @UtilityClass public class LogicalPlanDSL { + public static LogicalPlan write(LogicalPlan input, Table table) { + return new LogicalWrite(input, table); + } + public static LogicalPlan aggregation( LogicalPlan input, List aggregatorList, List groupByList) { return new LogicalAggregation(input, aggregatorList, groupByList); diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java index f7330b5c3d..9a41072fe7 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitor.java @@ -7,7 +7,7 @@ package org.opensearch.sql.planner.logical; import org.opensearch.sql.storage.read.TableScanBuilder; -import org.opensearch.sql.storage.TableWriteBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; /** * The visitor of {@link LogicalPlan}. @@ -29,6 +29,10 @@ public R visitTableScanBuilder(TableScanBuilder plan, C context) { return visitNode(plan, context); } + public R visitWrite(LogicalWrite plan, C context) { + return visitNode(plan, context); + } + public R visitTableWriteBuilder(TableWriteBuilder plan, C context) { return visitNode(plan, context); } diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java new file mode 100644 index 0000000000..5993b2b4ec --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java @@ -0,0 +1,34 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.planner.logical; + +import java.util.Collections; +import lombok.EqualsAndHashCode; +import lombok.Getter; +import lombok.ToString; +import org.opensearch.sql.storage.Table; + +/** + * Logical operator for insert statement. + */ +@EqualsAndHashCode(callSuper = true) +@ToString +public class LogicalWrite extends LogicalPlan { + + /** Table that handles the write operation. */ + @Getter + private final Table table; + + public LogicalWrite(LogicalPlan child, Table table) { + super(Collections.singletonList(child)); + this.table = table; + } + + @Override + public R accept(LogicalPlanNodeVisitor visitor, C context) { + return visitor.visitWrite(this, context); + } +} diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java index f241e76993..70847b869b 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizer.java @@ -17,6 +17,7 @@ import org.opensearch.sql.planner.optimizer.rule.PushFilterUnderSort; import org.opensearch.sql.planner.optimizer.rule.read.CreateTableScanBuilder; import org.opensearch.sql.planner.optimizer.rule.read.TableScanPushDown; +import org.opensearch.sql.planner.optimizer.rule.write.CreateTableWriteBuilder; /** * {@link LogicalPlan} Optimizer. @@ -55,7 +56,8 @@ public static LogicalPlanOptimizer create() { TableScanPushDown.PUSH_DOWN_SORT, TableScanPushDown.PUSH_DOWN_LIMIT, TableScanPushDown.PUSH_DOWN_HIGHLIGHT, - TableScanPushDown.PUSH_DOWN_PROJECT)); + TableScanPushDown.PUSH_DOWN_PROJECT, + new CreateTableWriteBuilder())); } /** diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java index 0ba478594a..b267658013 100644 --- a/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/pattern/Patterns.java @@ -20,6 +20,7 @@ import org.opensearch.sql.planner.logical.LogicalProject; import org.opensearch.sql.planner.logical.LogicalRelation; import org.opensearch.sql.planner.logical.LogicalSort; +import org.opensearch.sql.planner.logical.LogicalWrite; import org.opensearch.sql.storage.Table; import org.opensearch.sql.storage.read.TableScanBuilder; @@ -110,4 +111,14 @@ public static Property table() { ? Optional.of(((LogicalRelation) plan).getTable()) : Optional.empty()); } + + /** + * Logical relation with table field. + */ + public static Property writeTable() { + return Property.optionalProperty("table", + plan -> plan instanceof LogicalWrite + ? Optional.of(((LogicalWrite) plan).getTable()) + : Optional.empty()); + } } diff --git a/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/write/CreateTableWriteBuilder.java b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/write/CreateTableWriteBuilder.java new file mode 100644 index 0000000000..4fbf676862 --- /dev/null +++ b/core/src/main/java/org/opensearch/sql/planner/optimizer/rule/write/CreateTableWriteBuilder.java @@ -0,0 +1,48 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.planner.optimizer.rule.write; + +import static org.opensearch.sql.planner.optimizer.pattern.Patterns.writeTable; + +import com.facebook.presto.matching.Capture; +import com.facebook.presto.matching.Captures; +import com.facebook.presto.matching.Pattern; +import lombok.Getter; +import lombok.experimental.Accessors; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalWrite; +import org.opensearch.sql.planner.optimizer.Rule; +import org.opensearch.sql.storage.Table; +import org.opensearch.sql.storage.write.TableWriteBuilder; + +/** + * Rule that replaces logical write operator with {@link TableWriteBuilder} for later optimization + * and transforming to physical operator. + */ +public class CreateTableWriteBuilder implements Rule { + + /** Capture the table inside matched logical relation operator. */ + private final Capture
capture; + + /** Pattern that matches logical relation operator. */ + @Accessors(fluent = true) + @Getter + private final Pattern pattern; + + /** + * Construct create table write builder rule. + */ + public CreateTableWriteBuilder() { + this.capture = Capture.newCapture(); + this.pattern = Pattern.typeOf(LogicalWrite.class) + .with(writeTable().capturedAs(capture)); + } + + @Override + public LogicalPlan apply(LogicalWrite plan, Captures captures) { + return captures.get(capture).createWriteBuilder(plan); + } +} diff --git a/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java b/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java index a5a578b1d4..d4bc4a1ea9 100644 --- a/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java +++ b/core/src/main/java/org/opensearch/sql/planner/physical/PhysicalPlanNodeVisitor.java @@ -7,7 +7,7 @@ package org.opensearch.sql.planner.physical; import org.opensearch.sql.storage.TableScanOperator; -import org.opensearch.sql.storage.TableWriteOperator; +import org.opensearch.sql.storage.write.TableWriteOperator; /** * The visitor of {@link PhysicalPlan}. diff --git a/core/src/main/java/org/opensearch/sql/storage/Table.java b/core/src/main/java/org/opensearch/sql/storage/Table.java index 8196071a68..496281fa8d 100644 --- a/core/src/main/java/org/opensearch/sql/storage/Table.java +++ b/core/src/main/java/org/opensearch/sql/storage/Table.java @@ -10,8 +10,10 @@ import org.opensearch.sql.data.type.ExprType; import org.opensearch.sql.executor.streaming.StreamingSource; import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalWrite; import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; /** * Table. @@ -76,9 +78,10 @@ default TableScanBuilder createScanBuilder() { /* * Create table write builder for logical to physical transformation. * + * @param plan logical write plan * @return table write builder */ - default TableWriteBuilder createWriteBuilder() { + default TableWriteBuilder createWriteBuilder(LogicalWrite plan) { throw new UnsupportedOperationException( "Write operation is not supported on current table"); } diff --git a/core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java b/core/src/main/java/org/opensearch/sql/storage/write/TableWriteBuilder.java similarity index 74% rename from core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java rename to core/src/main/java/org/opensearch/sql/storage/write/TableWriteBuilder.java index c174b00377..54dfa5d557 100644 --- a/core/src/main/java/org/opensearch/sql/storage/TableWriteBuilder.java +++ b/core/src/main/java/org/opensearch/sql/storage/write/TableWriteBuilder.java @@ -3,17 +3,18 @@ * SPDX-License-Identifier: Apache-2.0 */ -package org.opensearch.sql.storage; +package org.opensearch.sql.storage.write; import java.util.Collections; import org.opensearch.sql.planner.logical.LogicalPlan; import org.opensearch.sql.planner.logical.LogicalPlanNodeVisitor; +import org.opensearch.sql.planner.physical.PhysicalPlan; /** * A {@link TableWriteBuilder} represents transition state between logical planning and physical * planning for table write operator. The concrete implementation class gets involved in the logical - * optimization through this abstraction and thus transform to specific {@link TableWriteOperator} in - * a certain data source. + * optimization through this abstraction and thus transform to specific {@link TableWriteOperator} + * in a certain storage engine. */ public abstract class TableWriteBuilder extends LogicalPlan { @@ -25,11 +26,12 @@ public TableWriteBuilder(LogicalPlan child) { } /** - * Build table write operator. + * Build table write operator with given child node. * + * @param child child operator node * @return table write operator */ - public abstract TableWriteOperator build(); + public abstract TableWriteOperator build(PhysicalPlan child); @Override public R accept(LogicalPlanNodeVisitor visitor, C context) { diff --git a/core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java b/core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java similarity index 96% rename from core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java rename to core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java index 5f922c51b4..007b725677 100644 --- a/core/src/main/java/org/opensearch/sql/storage/TableWriteOperator.java +++ b/core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java @@ -3,7 +3,7 @@ * SPDX-License-Identifier: Apache-2.0 */ -package org.opensearch.sql.storage; +package org.opensearch.sql.storage.write; import java.util.Collections; import java.util.List; diff --git a/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java b/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java index 2322e4684e..017cfb60ea 100644 --- a/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/DefaultImplementorTest.java @@ -58,6 +58,8 @@ import org.opensearch.sql.storage.Table; import org.opensearch.sql.storage.TableScanOperator; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; +import org.opensearch.sql.storage.write.TableWriteOperator; @ExtendWith(MockitoExtension.class) class DefaultImplementorTest { @@ -212,4 +214,17 @@ public TableScanOperator build() { }; assertEquals(tableScanOperator, tableScanBuilder.accept(implementor, null)); } + + @Test + public void visitTableWriteBuilderShouldBuildTableWriteOperator() { + LogicalPlan child = values(); + TableWriteOperator tableWriteOperator = Mockito.mock(TableWriteOperator.class); + TableWriteBuilder logicalPlan = new TableWriteBuilder(child) { + @Override + public TableWriteOperator build(PhysicalPlan child) { + return tableWriteOperator; + } + }; + assertEquals(tableWriteOperator, logicalPlan.accept(implementor, null)); + } } diff --git a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java index 33c6b02c38..ccb951037a 100644 --- a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java @@ -31,9 +31,12 @@ import org.opensearch.sql.expression.ReferenceExpression; import org.opensearch.sql.expression.aggregation.Aggregator; import org.opensearch.sql.expression.window.WindowDefinition; +import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.Table; import org.opensearch.sql.storage.TableScanOperator; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; +import org.opensearch.sql.storage.write.TableWriteOperator; /** * Todo. Temporary added for UT coverage, Will be removed. @@ -83,6 +86,19 @@ public TableScanOperator build() { assertNull(tableScanBuilder.accept(new LogicalPlanNodeVisitor() { }, null)); + LogicalPlan write = LogicalPlanDSL.write(null, table); + assertNull(write.accept(new LogicalPlanNodeVisitor() { + }, null)); + + TableWriteBuilder tableWriteBuilder = new TableWriteBuilder(null) { + @Override + public TableWriteOperator build(PhysicalPlan child) { + return null; + } + }; + assertNull(tableWriteBuilder.accept(new LogicalPlanNodeVisitor() { + }, null)); + LogicalPlan filter = LogicalPlanDSL.filter(relation, expression); assertNull(filter.accept(new LogicalPlanNodeVisitor() { }, null)); diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java index e2510ec464..137a830afd 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java @@ -7,6 +7,7 @@ package org.opensearch.sql.planner.optimizer; import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.junit.jupiter.api.Assertions.assertThrows; import static org.mockito.ArgumentMatchers.any; import static org.mockito.Mockito.when; import static org.opensearch.sql.data.model.ExprValueUtils.integerValue; @@ -20,6 +21,8 @@ import static org.opensearch.sql.planner.logical.LogicalPlanDSL.project; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.relation; import static org.opensearch.sql.planner.logical.LogicalPlanDSL.sort; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.values; +import static org.opensearch.sql.planner.logical.LogicalPlanDSL.write; import com.google.common.collect.ImmutableList; import java.util.Collections; @@ -39,6 +42,7 @@ import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.Table; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; @ExtendWith(MockitoExtension.class) class LogicalPlanOptimizerTest { @@ -270,6 +274,37 @@ public PhysicalPlan implement(LogicalPlan plan) { ); } + @Test + void table_support_write_builder_should_be_replaced() { + Mockito.reset(table, tableScanBuilder); + TableWriteBuilder writeBuilder = Mockito.mock(TableWriteBuilder.class); + when(table.createWriteBuilder(any())).thenReturn(writeBuilder); + + assertEquals( + writeBuilder, + optimize(write(values(), table)) + ); + } + + @Test + void table_not_support_write_builder_should_report_error() { + Mockito.reset(table, tableScanBuilder); + Table table = new Table() { + @Override + public Map getFieldTypes() { + return null; + } + + @Override + public PhysicalPlan implement(LogicalPlan plan) { + return null; + } + }; + + assertThrows(UnsupportedOperationException.class, + () -> table.createWriteBuilder(null)); + } + private LogicalPlan optimize(LogicalPlan plan) { final LogicalPlanOptimizer optimizer = LogicalPlanOptimizer.create(); final LogicalPlan optimize = optimizer.optimize(plan); diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java index 61d192362a..9f90fd8d05 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/pattern/PatternsTest.java @@ -35,5 +35,6 @@ void source_is_empty() { void table_is_empty() { plan = Mockito.mock(LogicalFilter.class); assertFalse(Patterns.table().getFunction().apply(plan).isPresent()); + assertFalse(Patterns.writeTable().getFunction().apply(plan).isPresent()); } } diff --git a/core/src/test/java/org/opensearch/sql/storage/write/TableWriteOperatorTest.java b/core/src/test/java/org/opensearch/sql/storage/write/TableWriteOperatorTest.java new file mode 100644 index 0000000000..8780b08276 --- /dev/null +++ b/core/src/test/java/org/opensearch/sql/storage/write/TableWriteOperatorTest.java @@ -0,0 +1,70 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.storage.write; + +import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.junit.jupiter.api.Assertions.assertTrue; + +import java.util.Collections; +import org.junit.jupiter.api.BeforeEach; +import org.junit.jupiter.api.Test; +import org.junit.jupiter.api.extension.ExtendWith; +import org.mockito.Mock; +import org.mockito.junit.jupiter.MockitoExtension; +import org.opensearch.sql.data.model.ExprValue; +import org.opensearch.sql.planner.physical.PhysicalPlan; +import org.opensearch.sql.planner.physical.PhysicalPlanNodeVisitor; + +@ExtendWith(MockitoExtension.class) +class TableWriteOperatorTest { + + @Mock + private PhysicalPlan child; + + private TableWriteOperator tableWrite; + + @BeforeEach + void setUp() { + tableWrite = new TableWriteOperator(child) { + @Override + public String explain() { + return "explain"; + } + + @Override + public boolean hasNext() { + return false; + } + + @Override + public ExprValue next() { + return null; + } + }; + } + + @Test + void testAccept() { + Boolean isVisited = tableWrite.accept(new PhysicalPlanNodeVisitor<>() { + @Override + protected Boolean visitNode(PhysicalPlan node, Object context) { + return (node instanceof TableWriteOperator); + } + + @Override + public Boolean visitTableWrite(TableWriteOperator node, Object context) { + return super.visitTableWrite(node, context); + } + }, null); + + assertTrue(isVisited); + } + + @Test + void testGetChild() { + assertEquals(Collections.singletonList(child), tableWrite.getChild()); + } +} \ No newline at end of file From 9a7ca084f0b9b62e938f2d1a83c57aa6f98825b9 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Fri, 25 Nov 2022 14:54:28 -0800 Subject: [PATCH 14/16] Rename child field Signed-off-by: Chen Dai --- .../opensearch/sql/storage/write/TableWriteOperator.java | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java b/core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java index 007b725677..92cdc6eb41 100644 --- a/core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java +++ b/core/src/main/java/org/opensearch/sql/storage/write/TableWriteOperator.java @@ -19,8 +19,8 @@ @RequiredArgsConstructor public abstract class TableWriteOperator extends PhysicalPlan { - /** Child physical node. */ - private final PhysicalPlan child; + /** Input physical node. */ + protected final PhysicalPlan input; @Override public R accept(PhysicalPlanNodeVisitor visitor, C context) { @@ -29,7 +29,7 @@ public R accept(PhysicalPlanNodeVisitor visitor, C context) { @Override public List getChild() { - return Collections.singletonList(child); + return Collections.singletonList(input); } /** From 0baec59c822bfdc5f2feb559a256397e76b9e610 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Fri, 25 Nov 2022 16:40:04 -0800 Subject: [PATCH 15/16] Add columns field Signed-off-by: Chen Dai --- .../sql/planner/logical/LogicalPlanDSL.java | 4 ++-- .../opensearch/sql/planner/logical/LogicalWrite.java | 12 ++++++++++-- .../planner/logical/LogicalPlanNodeVisitorTest.java | 3 ++- .../planner/optimizer/LogicalPlanOptimizerTest.java | 2 +- 4 files changed, 15 insertions(+), 6 deletions(-) diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java index 842f46fb0b..a192966287 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalPlanDSL.java @@ -32,8 +32,8 @@ @UtilityClass public class LogicalPlanDSL { - public static LogicalPlan write(LogicalPlan input, Table table) { - return new LogicalWrite(input, table); + public static LogicalPlan write(LogicalPlan input, Table table, List columns) { + return new LogicalWrite(input, table, columns); } public static LogicalPlan aggregation( diff --git a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java index 5993b2b4ec..496e6009e3 100644 --- a/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java +++ b/core/src/main/java/org/opensearch/sql/planner/logical/LogicalWrite.java @@ -6,6 +6,7 @@ package org.opensearch.sql.planner.logical; import java.util.Collections; +import java.util.List; import lombok.EqualsAndHashCode; import lombok.Getter; import lombok.ToString; @@ -15,16 +16,23 @@ * Logical operator for insert statement. */ @EqualsAndHashCode(callSuper = true) +@Getter @ToString public class LogicalWrite extends LogicalPlan { /** Table that handles the write operation. */ - @Getter private final Table table; - public LogicalWrite(LogicalPlan child, Table table) { + /** Optional column name list specified in insert statement. */ + private final List columns; + + /** + * Construct a logical write with given child node, table and column name list. + */ + public LogicalWrite(LogicalPlan child, Table table, List columns) { super(Collections.singletonList(child)); this.table = table; + this.columns = columns; } @Override diff --git a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java index ccb951037a..341bcbc29e 100644 --- a/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/logical/LogicalPlanNodeVisitorTest.java @@ -12,6 +12,7 @@ import com.google.common.collect.ImmutableList; import com.google.common.collect.ImmutableMap; +import java.util.Collections; import java.util.HashMap; import java.util.Map; import java.util.stream.Collectors; @@ -86,7 +87,7 @@ public TableScanOperator build() { assertNull(tableScanBuilder.accept(new LogicalPlanNodeVisitor() { }, null)); - LogicalPlan write = LogicalPlanDSL.write(null, table); + LogicalPlan write = LogicalPlanDSL.write(null, table, Collections.emptyList()); assertNull(write.accept(new LogicalPlanNodeVisitor() { }, null)); diff --git a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java index 137a830afd..7516aa1809 100644 --- a/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java +++ b/core/src/test/java/org/opensearch/sql/planner/optimizer/LogicalPlanOptimizerTest.java @@ -282,7 +282,7 @@ void table_support_write_builder_should_be_replaced() { assertEquals( writeBuilder, - optimize(write(values(), table)) + optimize(write(values(), table, Collections.emptyList())) ); } From ed114707545e09b2a76462c4a0eaebcf4514bee7 Mon Sep 17 00:00:00 2001 From: Chen Dai Date: Mon, 5 Dec 2022 17:07:57 -0800 Subject: [PATCH 16/16] Add opensearch index write and builder Signed-off-by: Chen Dai --- .../opensearch/client/OpenSearchClient.java | 2 + .../client/OpenSearchNodeClient.java | 21 +++ .../client/OpenSearchRestClient.java | 15 +++ .../opensearch/storage/OpenSearchIndex.java | 17 +++ .../storage/write/OpenSearchIndexWrite.java | 125 ++++++++++++++++++ .../write/OpenSearchIndexWriteBuilder.java | 35 +++++ .../write/OpenSearchIndexWriteTest.java | 107 +++++++++++++++ 7 files changed, 322 insertions(+) create mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWrite.java create mode 100644 opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteBuilder.java create mode 100644 opensearch/src/test/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteTest.java diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchClient.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchClient.java index dc6e72bd91..572d7c3df2 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchClient.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchClient.java @@ -44,6 +44,8 @@ public interface OpenSearchClient { */ Map getIndexMappings(String... indexExpression); + void bulk(final String indexName, List> data); + /** * Fetch index.max_result_window settings according to index expression given. * diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchNodeClient.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchNodeClient.java index 13fb0f6391..95f8935c17 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchNodeClient.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchNodeClient.java @@ -24,6 +24,8 @@ import org.opensearch.action.admin.indices.get.GetIndexResponse; import org.opensearch.action.admin.indices.mapping.get.GetMappingsResponse; import org.opensearch.action.admin.indices.settings.get.GetSettingsResponse; +import org.opensearch.action.bulk.BulkRequestBuilder; +import org.opensearch.action.bulk.BulkResponse; import org.opensearch.client.node.NodeClient; import org.opensearch.cluster.metadata.AliasMetadata; import org.opensearch.cluster.metadata.IndexNameExpressionResolver; @@ -75,6 +77,25 @@ public void createIndex(String indexName, Map mappings) { } } + @Override + public void bulk(final String indexName, List> data) { + BulkResponse response; + try { + BulkRequestBuilder builder = client.prepareBulk(indexName); + for (Map row : data) { + builder.add(client.prepareIndex().setSource(row).request()); + } + response = builder.get(); + } catch (Exception e) { + throw new IllegalStateException("Failed to bulk index [" + indexName + "]", e); + } + + if (response.hasFailures()) { + throw new IllegalStateException("Failure in bulk response: " + + response.buildFailureMessage()); + } + } + /** * Get field mappings of index by an index expression. Majority is copied from legacy * LocalClusterState. diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchRestClient.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchRestClient.java index d9f9dbbe5d..2937190505 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchRestClient.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/client/OpenSearchRestClient.java @@ -20,6 +20,8 @@ import org.opensearch.action.admin.cluster.settings.ClusterGetSettingsRequest; import org.opensearch.action.admin.indices.settings.get.GetSettingsRequest; import org.opensearch.action.admin.indices.settings.get.GetSettingsResponse; +import org.opensearch.action.bulk.BulkRequest; +import org.opensearch.action.index.IndexRequest; import org.opensearch.action.search.ClearScrollRequest; import org.opensearch.client.RequestOptions; import org.opensearch.client.RestHighLevelClient; @@ -67,6 +69,19 @@ public void createIndex(String indexName, Map mappings) { } } + @Override + public void bulk(String indexName, List> data) { + try { + BulkRequest bulkRequest = new BulkRequest(indexName); + for (Map source : data) { + bulkRequest.add(new IndexRequest().source(source)); + } + client.bulk(bulkRequest, RequestOptions.DEFAULT); + } catch (IOException e) { + throw new IllegalStateException("Failed to bulk index [" + indexName + "]", e); + } + } + @Override public Map getIndexMappings(String... indexExpression) { GetMappingsRequest request = new GetMappingsRequest().indices(indexExpression); diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java index c694769b89..b5f6b5356c 100644 --- a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/OpenSearchIndex.java @@ -7,8 +7,11 @@ package org.opensearch.sql.opensearch.storage; import com.google.common.annotations.VisibleForTesting; +import java.util.ArrayList; import java.util.HashMap; +import java.util.List; import java.util.Map; +import java.util.function.Function; import lombok.RequiredArgsConstructor; import org.opensearch.sql.common.setting.Settings; import org.opensearch.sql.data.type.ExprType; @@ -21,14 +24,18 @@ import org.opensearch.sql.opensearch.request.OpenSearchRequest; import org.opensearch.sql.opensearch.request.system.OpenSearchDescribeIndexRequest; import org.opensearch.sql.opensearch.storage.scan.OpenSearchIndexScanBuilder; +import org.opensearch.sql.opensearch.storage.write.OpenSearchIndexWrite; +import org.opensearch.sql.opensearch.storage.write.OpenSearchIndexWriteBuilder; import org.opensearch.sql.planner.DefaultImplementor; import org.opensearch.sql.planner.logical.LogicalAD; import org.opensearch.sql.planner.logical.LogicalML; import org.opensearch.sql.planner.logical.LogicalMLCommons; import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.logical.LogicalWrite; import org.opensearch.sql.planner.physical.PhysicalPlan; import org.opensearch.sql.storage.Table; import org.opensearch.sql.storage.read.TableScanBuilder; +import org.opensearch.sql.storage.write.TableWriteBuilder; /** OpenSearch table (index) implementation. */ public class OpenSearchIndex implements Table { @@ -125,6 +132,16 @@ public TableScanBuilder createScanBuilder() { return new OpenSearchIndexScanBuilder(indexScan); } + @Override + public TableWriteBuilder createWriteBuilder(LogicalWrite plan) { + // TODO: need to get column in the order when index created + List columns = (plan.getColumns().isEmpty()) + ? new ArrayList<>(getFieldTypes().keySet()) : plan.getColumns(); + Function createIndexWrite = + child -> new OpenSearchIndexWrite(child, client, settings, indexName, columns); + return new OpenSearchIndexWriteBuilder(plan, createIndexWrite); + } + @VisibleForTesting @RequiredArgsConstructor public static class OpenSearchDefaultImplementor diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWrite.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWrite.java new file mode 100644 index 0000000000..754cb44e92 --- /dev/null +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWrite.java @@ -0,0 +1,125 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.opensearch.storage.write; + +import static org.opensearch.sql.data.model.ExprValueUtils.stringValue; +import static org.opensearch.sql.data.model.ExprValueUtils.tupleValue; +import static org.opensearch.sql.executor.ExecutionEngine.Schema; +import static org.opensearch.sql.opensearch.request.OpenSearchRequest.IndexName; + +import com.google.common.collect.ImmutableMap; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.List; +import java.util.Map; +import java.util.stream.Collectors; +import java.util.stream.IntStream; +import org.opensearch.sql.common.setting.Settings; +import org.opensearch.sql.data.model.ExprValue; +import org.opensearch.sql.data.type.ExprCoreType; +import org.opensearch.sql.opensearch.client.OpenSearchClient; +import org.opensearch.sql.planner.physical.PhysicalPlan; +import org.opensearch.sql.storage.write.TableWriteOperator; + +/** + * OpenSearch index write operator. + */ +public class OpenSearchIndexWrite extends TableWriteOperator { + + /** OpenSearch low-level client. */ + private final OpenSearchClient client; + + /** Plugin settings. */ + private final Settings settings; + + /** Index name. */ + private final IndexName indexName; + + /** Column name list. */ + private final List columns; + + /** Counter of indexed documents. */ + private long count; + + public OpenSearchIndexWrite(PhysicalPlan child, + OpenSearchClient client, + Settings settings, + IndexName indexName, + List columns) { + super(child); + this.client = client; + this.settings = settings; + this.indexName = indexName; + this.columns = columns; + } + + @Override + public Schema schema() { + return new Schema(Arrays.asList( + new Schema.Column("message", "message", ExprCoreType.STRING))); + } + + @Override + public void open() { + super.open(); + + do { + List> nextBatch = loadNextBatch(); + if (nextBatch.isEmpty()) { + break; + } + count += nextBatch.size(); + client.bulk(indexName.toString(), nextBatch); + } while (true); + } + + @Override + public boolean hasNext() { + return (count > 0); + } + + @Override + public ExprValue next() { + ExprValue message = tupleValue( + ImmutableMap.of("message", stringValue(count + " row(s) impacted"))); + count = 0; + return message; + } + + @Override + public String explain() { + return indexName.toString(); + } + + // TODO: Add buffer size setting in perf test branch + private List> loadNextBatch() { + List> nextBatch = new ArrayList<>(); + while (input.hasNext()) { + ExprValue row = input.next(); + + // ValuesOperator is special whose result is collection of literal values without names + // Normally, tuple with map from column name to its value is returned from other operators + if (row.type() == ExprCoreType.ARRAY) { + nextBatch.add(loadValues(row)); + } else { + nextBatch.add(loadTuples(row)); + } + } + return nextBatch; + } + + private Map loadValues(ExprValue row) { + // zip column names and values list + List values = row.collectionValue(); + return IntStream.range(0, values.size()).boxed() + .collect(Collectors.toMap(columns::get, i -> values.get(i).value())); + } + + private Map loadTuples(ExprValue row) { + return row.tupleValue().entrySet().stream() + .collect(Collectors.toMap(Map.Entry::getKey, e -> e.getValue().value())); + } +} diff --git a/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteBuilder.java b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteBuilder.java new file mode 100644 index 0000000000..f06f767660 --- /dev/null +++ b/opensearch/src/main/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteBuilder.java @@ -0,0 +1,35 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.opensearch.storage.write; + +import java.util.function.Function; +import org.opensearch.sql.planner.logical.LogicalPlan; +import org.opensearch.sql.planner.physical.PhysicalPlan; +import org.opensearch.sql.storage.write.TableWriteBuilder; +import org.opensearch.sql.storage.write.TableWriteOperator; + +/** + * Builder implementation for OpenSearch index write operator. + */ +public class OpenSearchIndexWriteBuilder extends TableWriteBuilder { + + /** OpenSearch index write operator build function. */ + private final Function buildIndexWrite; + + /** + * Construct OpenSearch index write builder with child node and build function. + */ + public OpenSearchIndexWriteBuilder(LogicalPlan child, + Function buildIndexWrite) { + super(child); + this.buildIndexWrite = buildIndexWrite; + } + + @Override + public TableWriteOperator build(PhysicalPlan child) { + return buildIndexWrite.apply(child); + } +} diff --git a/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteTest.java b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteTest.java new file mode 100644 index 0000000000..5a2ab9048f --- /dev/null +++ b/opensearch/src/test/java/org/opensearch/sql/opensearch/storage/write/OpenSearchIndexWriteTest.java @@ -0,0 +1,107 @@ +/* + * Copyright OpenSearch Contributors + * SPDX-License-Identifier: Apache-2.0 + */ + +package org.opensearch.sql.opensearch.storage.write; + +import static org.hamcrest.MatcherAssert.assertThat; +import static org.hamcrest.Matchers.allOf; +import static org.hamcrest.Matchers.hasItems; +import static org.hamcrest.Matchers.iterableWithSize; +import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.mockito.Mockito.times; +import static org.mockito.Mockito.verify; +import static org.mockito.Mockito.when; +import static org.opensearch.sql.data.model.ExprValueUtils.collectionValue; +import static org.opensearch.sql.data.model.ExprValueUtils.tupleValue; +import static org.opensearch.sql.data.type.ExprCoreType.STRING; + +import com.google.common.collect.ImmutableMap; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.Collections; +import java.util.List; +import java.util.Map; +import org.junit.jupiter.api.BeforeEach; +import org.junit.jupiter.api.Test; +import org.junit.jupiter.api.extension.ExtendWith; +import org.mockito.Mock; +import org.mockito.junit.jupiter.MockitoExtension; +import org.opensearch.sql.common.setting.Settings; +import org.opensearch.sql.data.model.ExprValue; +import org.opensearch.sql.executor.ExecutionEngine; +import org.opensearch.sql.executor.ExecutionEngine.Schema.Column; +import org.opensearch.sql.opensearch.client.OpenSearchClient; +import org.opensearch.sql.opensearch.request.OpenSearchRequest.IndexName; +import org.opensearch.sql.planner.physical.PhysicalPlan; + +@ExtendWith(MockitoExtension.class) +class OpenSearchIndexWriteTest { + + @Mock + private PhysicalPlan input; + + @Mock + private OpenSearchClient client; + + @Mock + private Settings settings; + + private final IndexName indexName = new IndexName("test"); + + private final List columns = Arrays.asList("name", "age"); + + private OpenSearchIndexWrite indexWrite; + + @BeforeEach + void setUp() { + indexWrite = new OpenSearchIndexWrite(input, client, settings, indexName, columns); + } + + @Test + void testSchema() { + assertEquals( + new ExecutionEngine.Schema( + Collections.singletonList(new Column("message", "message", STRING))), + indexWrite.schema()); + } + + @Test + void testLoadValues() { + when(input.hasNext()).thenReturn(true, false); + when(input.next()).thenReturn(collectionValue(Arrays.asList("John", 25))); + + assertThat( + execute(), + allOf( + iterableWithSize(1), + hasItems( + tupleValue(ImmutableMap.of("message", "1 row(s) impacted"))))); + verify(client, times(1)).bulk("test", List.of(Map.of("name", "John", "age", 25))); + } + + @Test + void testLoadTuples() { + when(input.hasNext()).thenReturn(true, false); + when(input.next()).thenReturn(tupleValue(Map.of("name", "John", "age", 25))); + + assertThat( + execute(), + allOf( + iterableWithSize(1), + hasItems( + tupleValue(ImmutableMap.of("message", "1 row(s) impacted"))))); + verify(client, times(1)).bulk("test", List.of(Map.of("name", "John", "age", 25))); + } + + private List execute() { + List results = new ArrayList<>(); + indexWrite.open(); + while (indexWrite.hasNext()) { + results.add(indexWrite.next()); + } + indexWrite.close(); + return results; + } +} \ No newline at end of file