Merged
Changes from 2 commits
@@ -56,7 +56,7 @@ private CalcitePlanContext(FrameworkConfig config, Integer querySizeLimit, Query
this.config = config;
this.querySizeLimit = querySizeLimit;
this.queryType = queryType;
-this.connection = CalciteToolsHelper.connect(config, TYPE_FACTORY);
+this.connection = CalciteToolsHelper.connect(config, TYPE_FACTORY, querySizeLimit);
this.relBuilder = CalciteToolsHelper.create(config, TYPE_FACTORY, connection);
this.rexBuilder = new ExtendedRexBuilder(relBuilder.getRexBuilder());
this.functionProperties = new FunctionProperties(QueryType.PPL);
@@ -16,5 +16,5 @@
*/
public interface Scannable {

-public Enumerable<@Nullable Object> scan();
+public Enumerable<@Nullable Object> scan(Integer querySizeLimit);
}
@@ -37,8 +37,10 @@
import java.time.Instant;
import java.util.Properties;
import java.util.function.Consumer;
+import lombok.RequiredArgsConstructor;
import org.apache.calcite.adapter.enumerable.EnumerableConvention;
import org.apache.calcite.adapter.enumerable.EnumerableRel;
+import org.apache.calcite.adapter.enumerable.EnumerableRel.Prefer;
import org.apache.calcite.adapter.java.JavaTypeFactory;
import org.apache.calcite.avatica.AvaticaConnection;
import org.apache.calcite.avatica.AvaticaFactory;
@@ -113,15 +115,16 @@ public static RelBuilder create(
new OpenSearchRelBuilder(config.getContext(), cluster, relOptSchema));
}

-public static Connection connect(FrameworkConfig config, JavaTypeFactory typeFactory) {
+public static Connection connect(
+    FrameworkConfig config, JavaTypeFactory typeFactory, Integer querySizeLimit) {
final Properties info = new Properties();
if (config.getTypeSystem() != RelDataTypeSystem.DEFAULT) {
info.setProperty(
CalciteConnectionProperty.TYPE_SYSTEM.camelName(),
config.getTypeSystem().getClass().getName());
}
try {
-return new OpenSearchDriver().connect("jdbc:calcite:", info, null, typeFactory);
+return new OpenSearchDriver(querySizeLimit).connect("jdbc:calcite:", info, null, typeFactory);
Collaborator:
Could we append a Limit operator to each query instead of passing the limit through the OpenSearchDriver constructor?

Collaborator (Author):
That's a workable option as well; I listed it as an alternative solution in #3879 (comment).

It has the side effect of changing the original plan when the appended Limit operator cannot be pushed down.

OPTION1: Push down QUERY_SIZE_LIMIT to the final single scan

  • PROS: Doesn't change the plan, and the optimization process is efficient and straightforward
  • CONS: Only improves the restricted case of a single scan

OPTION2: Append a LIMIT operator to the original plan

  • PROS: Improves more cases than the single scan, e.g. Project-Scan, since SortProjectTransposeRule can swap the Limit before the Project
  • CONS: Will change the final plan if the Limit operator cannot be pushed down
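To make the trade-off concrete, here is a minimal, hypothetical Java sketch (not the actual plugin code; `Plan`, `scanWithLimit`, and `appendLimit` are invented names). OPTION1 caps rows inside the scan and leaves the plan shape unchanged, while OPTION2 wraps the plan in an explicit Limit node, which shows up in the EXPLAIN output:

```java
import java.util.List;
import java.util.stream.Stream;

public class LimitPlacementSketch {
    interface Plan {
        Stream<Integer> execute();
        String explain();
    }

    // OPTION1: the scan itself honors querySizeLimit; the plan shape is unchanged.
    static Plan scanWithLimit(List<Integer> rows, Integer querySizeLimit) {
        return new Plan() {
            public Stream<Integer> execute() {
                Stream<Integer> s = rows.stream();
                return querySizeLimit == null ? s : s.limit(querySizeLimit);
            }
            public String explain() { return "Scan"; }
        };
    }

    // OPTION2: wrap the original plan in a Limit operator; EXPLAIN output changes.
    static Plan appendLimit(Plan input, int fetch) {
        return new Plan() {
            public Stream<Integer> execute() { return input.execute().limit(fetch); }
            public String explain() { return "Limit(fetch=" + fetch + ")\n  " + input.explain(); }
        };
    }

    public static void main(String[] args) {
        List<Integer> rows = List.of(1, 2, 3, 4, 5);
        Plan opt1 = scanWithLimit(rows, 3);
        Plan opt2 = appendLimit(scanWithLimit(rows, null), 3);
        System.out.println(opt1.explain()); // Scan
        System.out.println(opt2.explain()); // Limit(fetch=3) over Scan
        System.out.println(opt1.execute().count()); // 3
        System.out.println(opt2.execute().count()); // 3
    }
}
```

Both options return at most three rows, but only OPTION2 changes what `explain()` reports, which is the CONS discussed above.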

Which option do we prefer? @penghuo @LantaoJin

Collaborator (Author):
If we implement eval push down in the future, OPTION2 will lose its PROS, since we could then push down all kinds of Project and leave only a single Scan.

@LantaoJin (Member, Jul 16, 2025):
Option 1 is more like a specific optimization for the query_size setting. I prefer Option 2 with a new LogicalSort subclass such as LogicalQueryLimit. That said, I am OK with both Option 1 and 2.

@penghuo (Collaborator, Jul 16, 2025):
+1 on Option 2.

> CONS: Will change the final plan if Limit operator cannot be push down

Could you elaborate on this? Are you suggesting that adding a LIMIT clause would change the result of the EXPLAIN plan? If that's the concern, I'm okay with it. We explicitly enforce a querySizeLimit for every query anyway.

The latest implementation is better; scanWithLimit is clean to me.

Collaborator (Author):
> Are you suggesting that adding a LIMIT clause would change the result of the EXPLAIN plan?

Yes.

Changing the plan risks being seen as changing the customer's intention, even though we do restrict the final result size.

I was also wondering why Hive and Spark don't do a similar optimization of appending a Limit operator. Reportedly (per an LLM), the current approach of counting rows during the final iteration has other advantages, including:

  1. Plan reuse for cases like pagination. PPL doesn't have such a feature yet, but it may be needed in the future.
  2. Better memory management. This doesn't apply to us yet, since the whole process happens on one coordinator, but it will matter once we move to distributed execution.
  3. Keeping the plan semantically equivalent to the user's SQL.

So for the long term, keeping the plan unchanged makes more sense and is standard practice.

} catch (SQLException e) {
throw new RuntimeException(e);
}
@@ -147,13 +150,16 @@ private static <R> R withPrepare(
}
final CalciteServerStatement statement =
connection.createStatement().unwrap(CalciteServerStatement.class);
-return new OpenSearchPrepareImpl().perform(statement, config, typeFactory, action);
+// QUERY_SIZE_LIMIT only takes effect in execution, not in planning.
+return new OpenSearchPrepareImpl(null).perform(statement, config, typeFactory, action);
} catch (Exception e) {
throw new RuntimeException(e);
}
}

+@RequiredArgsConstructor
public static class OpenSearchDriver extends Driver {
+private final Integer querySizeLimit;

public Connection connect(
String url, Properties info, CalciteSchema rootSchema, JavaTypeFactory typeFactory)
@@ -171,7 +177,7 @@ public Connection connect(

@Override
protected Function0<CalcitePrepare> createPrepareFactory() {
-return OpenSearchPrepareImpl::new;
+return () -> new OpenSearchPrepareImpl(querySizeLimit);
}
}

@@ -208,7 +214,10 @@ public AggCall avg(boolean distinct, String alias, RexNode operand) {
public static final SqlAggFunction VAR_SAMP_NULLABLE =
new NullableSqlAvgAggFunction(SqlKind.VAR_SAMP);

+@RequiredArgsConstructor
public static class OpenSearchPrepareImpl extends CalcitePrepareImpl {
+private final Integer QUERY_SIZE_LIMIT;

/**
* Similar to {@link CalcitePrepareImpl#perform(CalciteServerStatement, FrameworkConfig,
* Frameworks.BasePrepareAction)}, but with a custom typeFactory.
@@ -263,7 +272,8 @@ protected CalcitePrepareImpl.CalcitePreparingStmt getPreparingStmt(
prefer,
createCluster(planner, new RexBuilder(typeFactory)),
resultConvention,
-createConvertletTable());
+createConvertletTable(),
+QUERY_SIZE_LIMIT);
}
}

@@ -273,17 +283,19 @@ protected CalcitePrepareImpl.CalcitePreparingStmt getPreparingStmt(
*/
public static class OpenSearchCalcitePreparingStmt
extends CalcitePrepareImpl.CalcitePreparingStmt {
+private final Integer QUERY_SIZE_LIMIT;

public OpenSearchCalcitePreparingStmt(
CalcitePrepareImpl prepare,
CalcitePrepare.Context context,
CatalogReader catalogReader,
RelDataTypeFactory typeFactory,
CalciteSchema schema,
-EnumerableRel.Prefer prefer,
+Prefer prefer,
RelOptCluster cluster,
Convention resultConvention,
-SqlRexConvertletTable convertletTable) {
+SqlRexConvertletTable convertletTable,
+Integer querySizeLimit) {
super(
prepare,
context,
@@ -294,6 +306,7 @@ public OpenSearchCalcitePreparingStmt(
cluster,
resultConvention,
convertletTable);
+this.QUERY_SIZE_LIMIT = querySizeLimit;
}

@Override
@@ -302,7 +315,7 @@ protected PreparedResult implement(RelRoot root) {
RelDataType resultType = root.rel.getRowType();
boolean isDml = root.kind.belongsTo(SqlKind.DML);
if (root.rel instanceof Scannable scannable) {
-final Bindable bindable = dataContext -> scannable.scan();
+final Bindable bindable = dataContext -> scannable.scan(QUERY_SIZE_LIMIT);

return new PreparedResultImpl(
resultType,
@@ -98,9 +98,7 @@ public void executeWithCalcite(
() -> {
CalcitePlanContext context =
CalcitePlanContext.create(
buildFrameworkConfig(),
settings.getSettingValue(Key.QUERY_SIZE_LIMIT),
queryType);
buildFrameworkConfig(), getQuerySizeLimit(), queryType);
RelNode relNode = analyze(plan, context);
RelNode optimized = optimize(relNode);
RelNode calcitePlan = convertToCalcitePlan(optimized);
@@ -62,7 +62,7 @@ public void setUpContext() {
when(relBuilder.getRexBuilder()).thenReturn(rexBuilder);
when(rexBuilder.getTypeFactory()).thenReturn(TYPE_FACTORY);
mockedStatic = Mockito.mockStatic(CalciteToolsHelper.class);
-mockedStatic.when(() -> CalciteToolsHelper.connect(any(), any())).thenReturn(connection);
+mockedStatic.when(() -> CalciteToolsHelper.connect(any(), any(), any())).thenReturn(connection);

mockedStatic.when(() -> CalciteToolsHelper.create(any(), any(), any())).thenReturn(relBuilder);

@@ -1,6 +1,6 @@
{
"calcite": {
"logical": "LogicalProject(age=[$8])\n LogicalSort(offset=[2], fetch=[10])\n LogicalSort(offset=[1], fetch=[10])\n CalciteLogicalIndexScan(table=[[OpenSearch, opensearch-sql_test_index_account]])\n",
-"physical": "CalciteEnumerableIndexScan(table=[[OpenSearch, opensearch-sql_test_index_account]], PushDownContext=[[LIMIT->10, LIMIT->10, PROJECT->[age]], OpenSearchRequestBuilder(sourceBuilder={\"from\":3,\"size\":8,\"timeout\":\"1m\",\"_source\":{\"includes\":[\"age\"],\"excludes\":[]}}, requestedTotalSize=8, pageSize=null, startFrom=3)])\n"
+"physical": "CalciteEnumerableIndexScan(table=[[OpenSearch, opensearch-sql_test_index_account]], PushDownContext=[[LIMIT->10, PROJECT->[age], LIMIT->10], OpenSearchRequestBuilder(sourceBuilder={\"from\":3,\"size\":8,\"timeout\":\"1m\",\"_source\":{\"includes\":[\"age\"],\"excludes\":[]}}, requestedTotalSize=8, pageSize=null, startFrom=3)])\n"
}
}
}
@@ -1,6 +1,6 @@
{
"calcite": {
"logical": "LogicalProject(age=[$8])\n LogicalSort(fetch=[10])\n LogicalSort(fetch=[5])\n CalciteLogicalIndexScan(table=[[OpenSearch, opensearch-sql_test_index_account]])\n",
-"physical": "EnumerableLimit(fetch=[10])\n CalciteEnumerableIndexScan(table=[[OpenSearch, opensearch-sql_test_index_account]], PushDownContext=[[LIMIT->5, PROJECT->[age]], OpenSearchRequestBuilder(sourceBuilder={\"from\":0,\"size\":5,\"timeout\":\"1m\",\"_source\":{\"includes\":[\"age\"],\"excludes\":[]}}, requestedTotalSize=5, pageSize=null, startFrom=0)])\n"
+"physical": "CalciteEnumerableIndexScan(table=[[OpenSearch, opensearch-sql_test_index_account]], PushDownContext=[[LIMIT->5, PROJECT->[age], LIMIT->10], OpenSearchRequestBuilder(sourceBuilder={\"from\":0,\"size\":5,\"timeout\":\"1m\",\"_source\":{\"includes\":[\"age\"],\"excludes\":[]}}, requestedTotalSize=5, pageSize=null, startFrom=0)])\n"
}
}
@@ -88,7 +88,7 @@ public double estimateRowCount(RelMetadataQuery mq) {
case PROJECT, SORT -> rowCount;
case FILTER -> NumberUtil.multiply(
rowCount, RelMdUtil.guessSelectivity((RexNode) action.digest));
-case LIMIT -> (Integer) action.digest;
+case LIMIT -> Math.min(rowCount, (Integer) action.digest);
}
* estimateRowCountFactor,
(a, b) -> null);
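The `Math.min` change above reflects that a LIMIT can only lower a row-count estimate, never raise it above the input's estimate. A small self-contained sketch of that estimator logic (`limitRowCount` is an invented name, not the plugin's API):

```java
public class RowCountEstimate {
    // A LIMIT caps the estimate: the output can never exceed the input's row count.
    static double limitRowCount(double inputRowCount, int fetch) {
        return Math.min(inputRowCount, fetch);
    }

    public static void main(String[] args) {
        System.out.println(limitRowCount(100.0, 10)); // 10.0 -> the limit is selective
        System.out.println(limitRowCount(5.0, 10));   // 5.0  -> the old code would wrongly report 10
    }
}
```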
@@ -88,12 +88,16 @@ public Result implement(EnumerableRelImplementor implementor, Prefer pref) {
* or SearchAfter recorded during previous search.
*/
@Override
-public Enumerable<@Nullable Object> scan() {
+public Enumerable<@Nullable Object> scan(Integer querySizeLimit) {
return new AbstractEnumerable<>() {
@Override
public Enumerator<Object> enumerator() {
OpenSearchRequestBuilder requestBuilder = osIndex.createRequestBuilder();
pushDownContext.forEach(action -> action.apply(requestBuilder));
+// For the simple plan with only scan, try to push down querySizeLimit to avoid PIT search
+if (querySizeLimit != null && querySizeLimit > 0 && !pushDownContext.isAggregatePushed()) {
+requestBuilder.pushDownLimit(querySizeLimit, 0);
+}
return new OpenSearchIndexEnumerator(
osIndex.getClient(),
getFieldPath(),
@@ -104,6 +108,10 @@ public Enumerator<Object> enumerator() {
};
}

+public Enumerable<@Nullable Object> scan() {
+return scan(null);
+}
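As a rough illustration of the guard in `scan(Integer querySizeLimit)` above, the standalone sketch below (`shouldPushLimit` is an invented helper, not the plugin's API) mirrors the condition: the limit is pushed down only for plain scans, since once an aggregation has been pushed, the result size no longer tracks the number of scanned documents:

```java
public class PushDownGuard {
    // Push querySizeLimit into the search request only when it is a positive
    // value and no aggregation has been pushed down to the scan.
    static boolean shouldPushLimit(Integer querySizeLimit, boolean aggregatePushed) {
        return querySizeLimit != null && querySizeLimit > 0 && !aggregatePushed;
    }

    public static void main(String[] args) {
        System.out.println(shouldPushLimit(10000, false)); // true
        System.out.println(shouldPushLimit(10000, true));  // false
        System.out.println(shouldPushLimit(null, false));  // false
    }
}
```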

private List<String> getFieldPath() {
return getRowType().getFieldNames().stream()
.map(f -> osIndex.getAliasMapping().getOrDefault(f, f))