Skip to content

Commit f7b31b0

Browse files
committed
Merge from main
Signed-off-by: Harsha Vamsi Kalluri <[email protected]>
1 parent 9ff84a8 commit f7b31b0

File tree

10 files changed

+316
-19
lines changed

10 files changed

+316
-19
lines changed

CHANGELOG.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,7 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
5757
- Fix Unified highlighter for nested fields when using matchPhrasePrefixQuery ([#19442](https://github.com/opensearch-project/OpenSearch/pull/19442))
5858
- Add S3Repository.LEGACY_MD5_CHECKSUM_CALCULATION to list of repository-s3 settings ([#19788](https://github.com/opensearch-project/OpenSearch/pull/19788))
5959
- Fix NPE of ScriptScoreQuery ([#19650](https://github.com/opensearch-project/OpenSearch/pull/19650))
60+
- Fix `addEmptyBuckets` while reducing histograms from consuming too much memory and tripping CircuitBreaker ([#17718](https://github.com/opensearch-project/OpenSearch/pull/17718))
6061

6162
### Dependencies
6263
- Update to Gradle 9.2 ([#19575](https://github.com/opensearch-project/OpenSearch/pull/19575)) ([#19856](https://github.com/opensearch-project/OpenSearch/pull/19856))

rest-api-spec/src/main/resources/rest-api-spec/test/search.aggregation/10_histogram.yml

Lines changed: 71 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -682,3 +682,74 @@ setup:
682682
- match: { profile.shards.0.aggregations.0.debug.unoptimized_segments: 0 }
683683
- match: { profile.shards.0.aggregations.0.debug.leaf_visited: 1 }
684684
- match: { profile.shards.0.aggregations.0.debug.inner_visited: 0 }
685+
686+
---
# Regression test for PR #17718: when extended_bounds forces a huge number of empty
# buckets, the reduce phase must fail fast (breaker / max_buckets) instead of
# materializing the buckets and exhausting the heap.
"histogram creating empty buckets":
  - skip:
      version: " - 2.99.99"
      reason: fix currently only in 3.0

  - do:
      indices.create:
        index: test_cb
        body:
          settings:
            number_of_replicas: 0
            number_of_shards: 1
            refresh_interval: -1
          mappings:
            properties:
              number:
                type: integer

  - do:
      bulk:
        index: test_cb
        refresh: true
        body:
          - '{"index": {}}'
          - '{"number": 1}'
          - '{"index": {}}'
          - '{"number": 500}'
          - '{"index": {}}'
          - '{"number": 5000}'
          - '{"index": {}}'
          - '{"number": 500000}'

  # interval 10 over [0, 174155895372] implies billions of empty buckets; their
  # estimated memory is now charged up front, so the request breaker must trip.
  - do:
      catch: /circuit_breaking_exception/
      search:
        index: test_cb
        body:
          size: 0
          aggs:
            histo:
              histogram:
                field: number
                interval: 10
                extended_bounds:
                  min: 0
                  max: 174155895372

  - match: { error.type: "search_phase_execution_exception" }
  - match: { error.caused_by.type: "circuit_breaking_exception"}
  - match: { status: 429 }

  # interval 100000 implies ~1.7M buckets: small enough for the breaker but above
  # search.max_buckets, so the multi-bucket consumer must reject it (503).
  - do:
      catch: /too_many_buckets_exception/
      search:
        index: test_cb
        body:
          size: 0
          aggs:
            histo:
              histogram:
                field: number
                interval: 100000
                extended_bounds:
                  min: 0
                  max: 174155895372

  - match: { error.type: "search_phase_execution_exception" }
  - match: { error.caused_by.type: "too_many_buckets_exception"}
  - match: { status: 503 }

rest-api-spec/src/main/resources/rest-api-spec/test/search.aggregation/360_date_histogram.yml

Lines changed: 52 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -160,3 +160,55 @@ setup:
160160
- match: { profile.shards.0.aggregations.0.debug.unoptimized_segments: 0 }
161161
- match: { profile.shards.0.aggregations.0.debug.leaf_visited: 0 }
162162
- match: { profile.shards.0.aggregations.0.debug.inner_visited: 0 }
163+
164+
---
# Regression test for PR #17718: a date_histogram whose extended_bounds span an
# enormous range of empty buckets must trip the circuit breaker during reduce
# instead of building the buckets and running out of memory.
"date_histogram creating empty buckets":
  - skip:
      version: " - 2.99.99"
      reason: fix currently only in 3.0

  - do:
      indices.create:
        index: test_cb
        body:
          settings:
            number_of_replicas: 0
            number_of_shards: 1
            refresh_interval: -1
          mappings:
            properties:
              date:
                type: date

  - do:
      bulk:
        index: test_cb
        refresh: true
        body:
          - '{"index": {}}'
          - '{"date": "2016-01-01"}'
          - '{"index": {}}'
          - '{"date": "2016-01-02"}'
          - '{"index": {}}'
          - '{"date": "2016-02-01"}'
          - '{"index": {}}'
          - '{"date": "2016-03-01"}'

  # 10s intervals over epoch-millis bounds [0, 174155895372] (~1970..1975) imply
  # roughly 17 million empty buckets; the up-front estimate must trip the breaker.
  - do:
      catch: /circuit_breaking_exception/
      search:
        index: test_cb
        body:
          size: 0
          aggs:
            histo:
              date_histogram:
                field: date
                interval: 10s
                extended_bounds:
                  min: 0
                  max: 174155895372

  - match: { error.type: "search_phase_execution_exception" }
  - match: { error.caused_by.type: "circuit_breaking_exception"}
  - match: { status: 429 }

server/src/main/java/org/opensearch/search/SearchService.java

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1981,7 +1981,8 @@ public ReduceContext forFinalReduction() {
19811981
bigArrays,
19821982
scriptService,
19831983
multiBucketConsumerService.create(),
1984-
pipelineTree
1984+
pipelineTree,
1985+
multiBucketConsumerService.getBreaker()
19851986
);
19861987
}
19871988
};

server/src/main/java/org/opensearch/search/aggregations/InternalAggregation.java

Lines changed: 28 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,7 @@
3434
import org.opensearch.common.annotation.PublicApi;
3535
import org.opensearch.common.util.BigArrays;
3636
import org.opensearch.core.common.Strings;
37+
import org.opensearch.core.common.breaker.CircuitBreaker;
3738
import org.opensearch.core.common.io.stream.NamedWriteable;
3839
import org.opensearch.core.common.io.stream.StreamInput;
3940
import org.opensearch.core.common.io.stream.StreamOutput;
@@ -97,6 +98,7 @@ public static class ReduceContext {
9798
private final PipelineTree pipelineTreeRoot;
9899

99100
private boolean isSliceLevel;
101+
private final CircuitBreaker breaker;
100102
/**
101103
* Supplies the pipelines when the result of the reduce is serialized
102104
* to node versions that need pipeline aggregators to be serialized
@@ -112,13 +114,30 @@ public static ReduceContext forPartialReduction(
112114
ScriptService scriptService,
113115
Supplier<PipelineTree> pipelineTreeForBwcSerialization
114116
) {
115-
return new ReduceContext(bigArrays, scriptService, (s) -> {}, null, pipelineTreeForBwcSerialization);
117+
return new ReduceContext(bigArrays, scriptService, (s) -> {}, null, pipelineTreeForBwcSerialization, null);
116118
}
117119

118120
/**
119121
* Build a {@linkplain ReduceContext} to perform the final reduction.
120122
* @param pipelineTreeRoot The root of tree of pipeline aggregations for this request
121123
*/
124+
public static ReduceContext forFinalReduction(
125+
BigArrays bigArrays,
126+
ScriptService scriptService,
127+
IntConsumer multiBucketConsumer,
128+
PipelineTree pipelineTreeRoot,
129+
CircuitBreaker breaker
130+
) {
131+
return new ReduceContext(
132+
bigArrays,
133+
scriptService,
134+
multiBucketConsumer,
135+
requireNonNull(pipelineTreeRoot, "prefer EMPTY to null"),
136+
() -> pipelineTreeRoot,
137+
breaker
138+
);
139+
}
140+
122141
public static ReduceContext forFinalReduction(
123142
BigArrays bigArrays,
124143
ScriptService scriptService,
@@ -130,7 +149,8 @@ public static ReduceContext forFinalReduction(
130149
scriptService,
131150
multiBucketConsumer,
132151
requireNonNull(pipelineTreeRoot, "prefer EMPTY to null"),
133-
() -> pipelineTreeRoot
152+
() -> pipelineTreeRoot,
153+
null
134154
);
135155
}
136156

@@ -139,14 +159,16 @@ private ReduceContext(
139159
ScriptService scriptService,
140160
IntConsumer multiBucketConsumer,
141161
PipelineTree pipelineTreeRoot,
142-
Supplier<PipelineTree> pipelineTreeForBwcSerialization
162+
Supplier<PipelineTree> pipelineTreeForBwcSerialization,
163+
CircuitBreaker breaker
143164
) {
144165
this.bigArrays = bigArrays;
145166
this.scriptService = scriptService;
146167
this.multiBucketConsumer = multiBucketConsumer;
147168
this.pipelineTreeRoot = pipelineTreeRoot;
148169
this.pipelineTreeForBwcSerialization = pipelineTreeForBwcSerialization;
149170
this.isSliceLevel = false;
171+
this.breaker = breaker;
150172
}
151173

152174
/**
@@ -210,6 +232,9 @@ public void consumeBucketsAndMaybeBreak(int size) {
210232
multiBucketConsumer.accept(size);
211233
}
212234

235+
/**
 * @return the circuit breaker charged while reducing, or {@code null} when this
 *         context performs no breaker accounting (e.g. partial reductions)
 */
public CircuitBreaker getBreaker() {
    return breaker;
}
213238
}
214239

215240
protected final String name;

server/src/main/java/org/opensearch/search/aggregations/MultiBucketConsumerService.java

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -218,4 +218,9 @@ public int getLimit() {
218218
public MultiBucketConsumer create() {
219219
return new MultiBucketConsumer(maxBucket, breaker);
220220
}
221+
222+
/**
 * Exposes the request circuit breaker backing the consumers created by this service,
 * so reduce contexts can charge estimated bucket memory against it.
 *
 * @return the request-scoped {@link CircuitBreaker}
 */
public CircuitBreaker getBreaker() {
    return breaker;
}
225+
221226
}

server/src/main/java/org/opensearch/search/aggregations/bucket/histogram/InternalDateHistogram.java

Lines changed: 50 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,7 @@
3434
import org.apache.lucene.util.CollectionUtil;
3535
import org.apache.lucene.util.PriorityQueue;
3636
import org.opensearch.common.Rounding;
37+
import org.opensearch.core.common.breaker.CircuitBreaker;
3738
import org.opensearch.core.common.io.stream.StreamInput;
3839
import org.opensearch.core.common.io.stream.StreamOutput;
3940
import org.opensearch.core.xcontent.XContentBuilder;
@@ -58,6 +59,9 @@
5859
import java.util.Map;
5960
import java.util.Objects;
6061

62+
import static java.lang.Math.max;
63+
import static java.lang.Math.min;
64+
6165
/**
6266
* Implementation of {@link Histogram}.
6367
*
@@ -322,7 +326,7 @@ public Bucket createBucket(InternalAggregations aggregations, Bucket prototype)
322326
return new Bucket(prototype.key, prototype.docCount, prototype.keyed, prototype.format, aggregations);
323327
}
324328

325-
private List<Bucket> reduceBuckets(List<InternalAggregation> aggregations, ReduceContext reduceContext) {
329+
List<Bucket> reduceBuckets(List<InternalAggregation> aggregations, ReduceContext reduceContext) {
326330
final PriorityQueue<IteratorAndCurrent<Bucket>> pq = new PriorityQueue<IteratorAndCurrent<Bucket>>(aggregations.size()) {
327331
@Override
328332
protected boolean lessThan(IteratorAndCurrent<Bucket> a, IteratorAndCurrent<Bucket> b) {
@@ -394,9 +398,48 @@ protected Bucket reduceBucket(List<Bucket> buckets, ReduceContext context) {
394398
return createBucket(buckets.get(0).key, docCount, aggs);
395399
}
396400

397-
private void addEmptyBuckets(List<Bucket> list, ReduceContext reduceContext) {
401+
private int estimateTotalBucketCount(List<Bucket> list) {
402+
LongBounds bounds = emptyBucketInfo.bounds;
403+
int bucketCount = 0;
404+
if (bounds != null && bounds.getMin() != null && bounds.getMax() != null) {
405+
long min = min(bounds.getMin() + offset, list.getFirst().key);
406+
long max = max(bounds.getMax() + offset, list.getLast().key);
407+
long intervalWidth = 0;
408+
int i = 0;
409+
long key = min;
410+
while (key < max && i++ < 10) {
411+
bucketCount++;
412+
long nextKey = nextKey(key).longValue();
413+
intervalWidth = max(intervalWidth, nextKey - key);
414+
key = nextKey;
415+
}
416+
if (bucketCount < 10) {
417+
return bucketCount;
418+
}
419+
long estimatedBuckets = Math.round(Math.ceil((double) (max - min) / intervalWidth));
420+
if (estimatedBuckets > Integer.MAX_VALUE) {
421+
return Integer.MAX_VALUE;
422+
}
423+
return (int) estimatedBuckets;
424+
}
425+
return list.size();
426+
}
427+
428+
void addEmptyBuckets(List<Bucket> list, ReduceContext reduceContext) {
398429
Bucket lastBucket = null;
399430
LongBounds bounds = emptyBucketInfo.bounds;
431+
final int originalSize = list.size();
432+
// we use counts here only to add those values to the CircuitBreaker, list's count has already been added in #reduce, so we only
433+
// need to add emptyBucketCount
434+
final int estimateEmptyBucketCount = estimateTotalBucketCount(list) - originalSize;
435+
assert estimateEmptyBucketCount >= 0;
436+
CircuitBreaker breaker = reduceContext.getBreaker();
437+
if (breaker != null) {
438+
// 50 bytes memory usage for each empty bucket
439+
breaker.addEstimateBytesAndMaybeBreak(50L * estimateEmptyBucketCount, "empty date histogram buckets");
440+
}
441+
reduceContext.consumeBucketsAndMaybeBreak(estimateEmptyBucketCount);
442+
400443
ListIterator<Bucket> iter = list.listIterator();
401444

402445
// first adding all the empty buckets *before* the actual data (based on th extended_bounds.min the user requested)
@@ -452,11 +495,16 @@ private void addEmptyBuckets(List<Bucket> list, ReduceContext reduceContext) {
452495
key = nextKey(key).longValue();
453496
}
454497
}
498+
int postAddEmptyBucketCount = list.size() - estimateEmptyBucketCount - originalSize;
499+
if (postAddEmptyBucketCount > 0) {
500+
reduceContext.consumeBucketsAndMaybeBreak(postAddEmptyBucketCount);
501+
}
455502
}
456503

457504
@Override
458505
public InternalAggregation reduce(List<InternalAggregation> aggregations, ReduceContext reduceContext) {
459506
List<Bucket> reducedBuckets = reduceBuckets(aggregations, reduceContext);
507+
reduceContext.consumeBucketsAndMaybeBreak(reducedBuckets.size());
460508
if (reduceContext.isFinalReduce()) {
461509
if (minDocCount == 0) {
462510
addEmptyBuckets(reducedBuckets, reduceContext);
@@ -473,7 +521,6 @@ public InternalAggregation reduce(List<InternalAggregation> aggregations, Reduce
473521
CollectionUtil.introSort(reducedBuckets, order.comparator());
474522
}
475523
}
476-
reduceContext.consumeBucketsAndMaybeBreak(reducedBuckets.size());
477524
return new InternalDateHistogram(
478525
getName(),
479526
reducedBuckets,

0 commit comments

Comments
 (0)