Merged
Changes from 1 commit
30 commits
c4bfdb7
Add HistogramField.
iverase Oct 28, 2019
550394c
checkStyle
iverase Oct 28, 2019
9d4f9c4
more checkStyle
iverase Oct 28, 2019
4e3eed7
Addressed part of the review
iverase Oct 29, 2019
a168d32
Extract the logic of creating a new histogram to a separate method
iverase Oct 29, 2019
038d429
Addressed more comments.
iverase Oct 29, 2019
edc2faf
formatting
iverase Oct 29, 2019
c527aec
extract logic for getting histogram in TDigest
iverase Oct 29, 2019
bd59238
remove unused imports
iverase Oct 29, 2019
71886a8
rename test class
iverase Oct 29, 2019
793a257
Detect in the constructor if we expect histogram value source
iverase Oct 29, 2019
579c05c
revert last change
iverase Oct 29, 2019
af1249f
Values must be provided in increasing order
iverase Oct 31, 2019
1cb8f53
Handling null value and do not fail if arrays are empty, trate it as a
iverase Oct 31, 2019
93229e5
Handle ignore malformed properly
iverase Oct 31, 2019
996f8fc
Merge branch 'master' into histogramField
iverase Oct 31, 2019
edec448
initial documentation for the new field
iverase Oct 31, 2019
adf12a4
initial documentation for the new field
iverase Oct 31, 2019
3c5892e
Addressed docs review
iverase Nov 1, 2019
19f15a2
Add HistogramFieldTypeTests
iverase Nov 1, 2019
1f6383d
address last review comments
iverase Nov 3, 2019
fe039ee
Merge branch 'master' into histogramField
iverase Nov 3, 2019
40f679d
Merge branch 'master' into histogramField
iverase Nov 15, 2019
79f7fd9
Merge branch 'master' into histogramField
iverase Nov 27, 2019
fbabf1c
Make sure that in ignore malformed we move to the end of the
iverase Nov 27, 2019
f1a1ead
address review comments
iverase Nov 28, 2019
c8a1f12
remove support for parsed fields
iverase Nov 28, 2019
0045a8b
Merge branch 'master' into histogramField
elasticmachine Nov 28, 2019
f8cf1a7
addressed last comments
iverase Nov 28, 2019
2e8649a
Merge branch 'histogramField' of github.com:iverase/elasticsearch int…
iverase Nov 28, 2019
@@ -3,8 +3,8 @@

 A `multi-value` metrics aggregation that calculates one or more percentiles
 over numeric values extracted from the aggregated documents. These values can be
-generated by a provided script or extracted from specific numeric or histogram
-fields in the documents.
+generated by a provided script or extracted from specific numeric or
+<<histogram,histogram fields>> in the documents.

Percentiles show the point at which a certain percentage of observed values
occur. For example, the 95th percentile is the value which is greater than 95%
@@ -3,8 +3,8 @@

 A `multi-value` metrics aggregation that calculates one or more percentile ranks
 over numeric values extracted from the aggregated documents. These values can be
-generated by a provided script or extracted from specific numeric or histogram
-fields in the documents.
+generated by a provided script or extracted from specific numeric or
+<<histogram,histogram fields>> in the documents.

[NOTE]
==================================================
21 changes: 12 additions & 9 deletions docs/reference/mapping/types/histogram.asciidoc
@@ -39,23 +39,26 @@ following aggregations and queries:
* <<search-aggregations-metrics-percentile-rank-aggregation,percentile ranks>> aggregation
* <<query-dsl-exists-query,exists>> query

We recommend you define the buckets in the `values` array based on the type of aggregation you intend to use.

[[mapping-types-histogram-building-histogram]]
==== Building a histogram

When using a histogram as part of an aggregation, the accuracy of the results will depend on how the
histogram was constructed. It is important to consider the percentiles aggregation mode that will be used
to build it. Some possibilities include:

-- For the <<search-aggregations-metrics-percentile-aggregation, T-Digest>> mode, histograms
-can be built by using the mean value of the centroids and the centroid's count. If the algorithm has already
-started to approximate the percentiles, this inaccuracy is carried over in the histogram.
+- For the <<search-aggregations-metrics-percentile-aggregation, T-Digest>> mode, the `values` array represents
+the mean centroid positions and the `counts` array represents the number of values that are attributed to each
+centroid. If the algorithm has already started to approximate the percentiles, this inaccuracy is
+carried over in the histogram.

+- For the <<_hdr_histogram,High Dynamic Range (HDR)>> histogram mode, the `values` array represents fixed upper
+limits of each bucket interval, and the `counts` array represents the number of values that are attributed to each
+interval. This implementation maintains a fixed worst-case percentage error (specified as a number of significant digits),
+therefore the value used when generating the histogram would be the maximum accuracy you can achieve at aggregation time.

-- For the <<_hdr_histogram,High Dynamic Range (HDR)>> histogram mode, histograms
-can be created by using the recorded values and the count at that value. This implementation maintains a fixed worst-case
-percentage error (specified as a number of significant digits), therefore the value used when generating the histogram
-would be the maximum accuracy you can achieve at aggregation time.

+The histogram field is "algorithm agnostic" and does not store data specific to either T-Digest or HDRHistogram. While this
+means the field can technically be aggregated with either algorithm, in practice the user should choose one algorithm and
+index data in that manner (e.g. centroids for T-Digest or intervals for HDRHistogram) to ensure the best accuracy.

Contributor:
Perhaps another sentence/paragraph at the end?

The histogram field is "algorithm agnostic" and does not store data specific to either T-Digest or HDRHistogram. While this means the field can technically be aggregated with either algorithm, in practice the user should chose one algorithm and index data in that manner (e.g. centroids for T-Digest or intervals for HDRHistogram) to ensure best accuracy.

Or something similar... trying to convey to the user that how they index the data is important and they should chose upfront.
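
To make the "choose one algorithm upfront" advice concrete, here is a minimal Java sketch — not part of this PR — of how a client might derive the `values`/`counts` arrays from T-Digest centroids before indexing. The field name `my_histo`, the compression setting, and the sample data are illustrative assumptions; the `TDigest`/`Centroid` APIs are the same ones this PR's tests use.

```java
import com.tdunning.math.stats.Centroid;
import com.tdunning.math.stats.TDigest;

import java.util.ArrayList;
import java.util.List;

public class HistogramDocSketch {
    public static void main(String[] args) {
        // Pre-aggregate raw samples client-side with T-Digest (a compression
        // of 100.0 is an illustrative choice, not a value mandated by the PR).
        TDigest digest = TDigest.createMergingDigest(100.0);
        for (double latency : new double[] {0.1, 0.2, 0.3, 0.3, 0.35, 0.4}) {
            digest.add(latency);
        }
        List<Double> values = new ArrayList<>();
        List<Integer> counts = new ArrayList<>();
        // Centroids come back in ascending order of mean, which satisfies the
        // mapper's rule that `values` must be provided in increasing order.
        for (Centroid centroid : digest.centroids()) {
            values.add(centroid.mean());
            counts.add(centroid.count());
        }
        // The resulting arrays become the histogram field of the document,
        // e.g. {"my_histo": {"values": [...], "counts": [...]}}.
        System.out.println("values=" + values + " counts=" + counts);
    }
}
```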

[[histogram-ex]]
==== Examples
@@ -112,7 +112,7 @@ public void collect(int doc, long bucket) throws IOException {
DoubleHistogram state = getExistingOrNewHistogram(bigArrays, bucket);
if (values.advanceExact(doc)) {
final HistogramValue sketch = values.histogram();
-while(sketch.next()) {
+while (sketch.next()) {
state.recordValueWithCount(sketch.value(), sketch.count());
}
}
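
The `collect()` loop above simply replays the stored (value, count) pairs into the HDR state. As a standalone illustration of why that works, here is a hedged sketch using the HdrHistogram library directly; the sample arrays and the 3-significant-digit setting are assumptions for the example, not values from the PR.

```java
import org.HdrHistogram.DoubleHistogram;

public class ReplaySketch {
    public static void main(String[] args) {
        // Pre-aggregated pairs as they might come out of a histogram field.
        double[] values = {0.1, 0.2, 0.3, 0.4};
        long[] counts = {3, 7, 23, 12};
        // 3 significant digits bounds the worst-case relative error.
        DoubleHistogram state = new DoubleHistogram(3);
        for (int i = 0; i < values.length; i++) {
            state.recordValueWithCount(values[i], counts[i]);
        }
        System.out.println("p95 ~= " + state.getValueAtPercentile(95.0));
    }
}
```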
@@ -26,6 +26,7 @@
import org.elasticsearch.common.settings.Settings;
import org.elasticsearch.common.xcontent.XContentBuilder;
import org.elasticsearch.common.xcontent.XContentParser;
+import org.elasticsearch.common.xcontent.XContentSubParser;
import org.elasticsearch.common.xcontent.support.XContentMapValues;
import org.elasticsearch.index.IndexSettings;
import org.elasticsearch.index.fielddata.AtomicHistogramFieldData;
@@ -298,8 +299,8 @@ private HistogramValue getHistogramValue(final BytesRef bytesRef) throws IOException {
@Override
public boolean next() throws IOException {
if (streamInput.available() > 0) {
-value = streamInput.readDouble();
 count = streamInput.readVInt();
+value = streamInput.readDouble();
return true;
}
isExhausted = true;
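
After this reordering, each doc-values entry is laid out count-first, then value, and the reader above mirrors that order until the stream is exhausted. Below is a self-contained sketch of the same round trip; it uses plain java.io streams with fixed-width ints in place of Elasticsearch's variable-length writeVInt/readVInt, so treat the byte-level layout as an approximation.

```java
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.DataInputStream;
import java.io.DataOutputStream;
import java.io.IOException;

public class LayoutSketch {
    public static void main(String[] args) throws IOException {
        ByteArrayOutputStream bytes = new ByteArrayOutputStream();
        DataOutputStream out = new DataOutputStream(bytes);
        // Two entries, each written count-first, then value.
        out.writeInt(7);
        out.writeDouble(0.35);
        out.writeInt(12);
        out.writeDouble(0.4);
        DataInputStream in = new DataInputStream(new ByteArrayInputStream(bytes.toByteArray()));
        // Mirrors the next() loop above: read until the stream is exhausted.
        while (in.available() > 0) {
            int count = in.readInt();
            double value = in.readDouble();
            System.out.println(value + " x " + count);
        }
    }
}
```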
Expand Down Expand Up @@ -352,7 +353,7 @@ public void parse(ParseContext context) throws IOException {
}
context.path().add(simpleName());
XContentParser.Token token = null;
-int level = 0;
+XContentSubParser subParser = null;
try {
token = context.parser().currentToken();
if (token == XContentParser.Token.VALUE_NULL) {
@@ -363,22 +364,23 @@ public void parse(ParseContext context) throws IOException {
IntArrayList counts = null;
// should be an object
ensureExpectedToken(XContentParser.Token.START_OBJECT, token, context.parser()::getTokenLocation);
-token = context.parser().nextToken();
+subParser = new XContentSubParser(context.parser());
+token = subParser.nextToken();
while (token != XContentParser.Token.END_OBJECT) {
// should be a field
-ensureExpectedToken(XContentParser.Token.FIELD_NAME, token, context.parser()::getTokenLocation);
-String fieldName = context.parser().currentName();
+ensureExpectedToken(XContentParser.Token.FIELD_NAME, token, subParser::getTokenLocation);
+String fieldName = subParser.currentName();
if (fieldName.equals(VALUES_FIELD.getPreferredName())) {
-token = context.parser().nextToken();
+token = subParser.nextToken();
// should be an array
-ensureExpectedToken(XContentParser.Token.START_ARRAY, token, context.parser()::getTokenLocation);
+ensureExpectedToken(XContentParser.Token.START_ARRAY, token, subParser::getTokenLocation);
values = new DoubleArrayList();
-token = context.parser().nextToken();
+token = subParser.nextToken();
double previousVal = -Double.MAX_VALUE;
while (token != XContentParser.Token.END_ARRAY) {
// should be a number
-ensureExpectedToken(XContentParser.Token.VALUE_NUMBER, token, context.parser()::getTokenLocation);
-double val = context.parser().doubleValue();
+ensureExpectedToken(XContentParser.Token.VALUE_NUMBER, token, subParser::getTokenLocation);
+double val = subParser.doubleValue();
if (val < previousVal) {
// values must be in increasing order
throw new MapperParsingException("error parsing field ["
@@ -387,28 +389,26 @@
}
values.add(val);
previousVal = val;
-token = context.parser().nextToken();
+token = subParser.nextToken();
}
} else if (fieldName.equals(COUNTS_FIELD.getPreferredName())) {
-token = context.parser().nextToken();
+token = subParser.nextToken();
// should be an array
-ensureExpectedToken(XContentParser.Token.START_ARRAY, token, context.parser()::getTokenLocation);
+ensureExpectedToken(XContentParser.Token.START_ARRAY, token, subParser::getTokenLocation);
counts = new IntArrayList();
-token = context.parser().nextToken();
+token = subParser.nextToken();
while (token != XContentParser.Token.END_ARRAY) {
// should be a number
-ensureExpectedToken(XContentParser.Token.VALUE_NUMBER, token, context.parser()::getTokenLocation);
-counts.add(context.parser().intValue());
-token = context.parser().nextToken();
+ensureExpectedToken(XContentParser.Token.VALUE_NUMBER, token, subParser::getTokenLocation);
+counts.add(subParser.intValue());
+token = subParser.nextToken();
}
} else {
throw new MapperParsingException("error parsing field [" +
name() + "], with unknown parameter [" + fieldName + "]");
}
-token = context.parser().nextToken();
-level = maybeAddOrRemoveLevel(token, level);
+token = subParser.nextToken();
}
-level = 0;
if (values == null) {
throw new MapperParsingException("error parsing field ["
+ name() + "], expected field called [" + VALUES_FIELD.getPreferredName() + "]");
@@ -431,8 +431,8 @@ public void parse(ParseContext context) throws IOException {
+ name() + "], ["+ COUNTS_FIELD + "] elements must be >= 0 but got " + counts.get(i));
} else if (count > 0) {
// we do not add elements with count == 0
-streamOutput.writeDouble(values.get(i));
streamOutput.writeVInt(count);
Contributor:
I'd suggest putting the count before the values, it might make it easier to better compress in the future by stealing bits of the count.

+streamOutput.writeDouble(values.get(i));
}
Contributor:
should we skip values that have a count of 0 from doc values?

Contributor Author:
make sense, added code to skip zero counts

}
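
Pulling the parsing and writing rules above together — `values` must be non-decreasing, `counts` must be non-negative, the two arrays should match in length, and zero-count entries are dropped, with each kept entry written count-first — a simplified stand-alone version of the write loop might look like the sketch below. It uses plain java.io with fixed-width ints instead of Elasticsearch's stream classes and VInts, so the class and byte layout are assumptions for illustration.

```java
import java.io.ByteArrayOutputStream;
import java.io.DataOutputStream;
import java.io.IOException;

public class WriteLoopSketch {
    static byte[] encode(double[] values, int[] counts) throws IOException {
        if (values.length != counts.length) {
            throw new IllegalArgumentException("expected same length from values and counts");
        }
        ByteArrayOutputStream bytes = new ByteArrayOutputStream();
        DataOutputStream out = new DataOutputStream(bytes);
        double previousVal = -Double.MAX_VALUE;
        for (int i = 0; i < values.length; i++) {
            if (values[i] < previousVal) {
                throw new IllegalArgumentException("values must be provided in increasing order");
            }
            if (counts[i] < 0) {
                throw new IllegalArgumentException("counts elements must be >= 0");
            }
            if (counts[i] > 0) {
                // entries with count == 0 are skipped entirely
                out.writeInt(counts[i]);      // count first, per the review suggestion
                out.writeDouble(values[i]);
            }
            previousVal = values[i];
        }
        return bytes.toByteArray();
    }

    public static void main(String[] args) throws IOException {
        byte[] encoded = encode(new double[] {0.1, 0.2, 0.3}, new int[] {3, 0, 7});
        System.out.println(encoded.length + " bytes"); // 2 entries x (4 + 8) = 24 bytes
    }
}
```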

@@ -451,27 +451,16 @@ public void parse(ParseContext context) throws IOException {
ex, fieldType().name(), fieldType().typeName());
}
Contributor:
When ignoreMalformed is true, I think we should also try to move to the end of the histogram object so that other fields can be parsed successfully. See how the geo_shape field does it for instance.

Contributor Author:
I added my own logic to skip the field to the end. Not sure if there is some other utility to what I am doing here by hand.

Contributor:
This is what XContentSubParser has been designed for. See #35603. Maybe it would be more robust? By the way looking at the latest version of GeoShapeFieldMapper, it looks like it no longer handles ignoreMalformed correctly, or am I misreading it cc @imotov ?

// we need to advance until the end of the field
-if (token != null) {
-while (level > 0 || token != XContentParser.Token.END_OBJECT) {
-level = maybeAddOrRemoveLevel(token, level);
-token = context.parser().nextToken();
+if (subParser != null) {
+while (token != null) {
+token = subParser.nextToken();
}
Contributor:
Do subParser.close() instead?

}
context.addIgnoredField(fieldType().name());
}
context.path().remove();
}

-private int maybeAddOrRemoveLevel(XContentParser.Token token, int level) {
-if (token == XContentParser.Token.START_OBJECT) {
-return ++level;
-}
-if (token == XContentParser.Token.END_OBJECT) {
-return --level;
-}
-return level;
-}
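
The helper removed above tracked nesting depth by hand; XContentSubParser owns that bookkeeping, and per the review thread, closing it (or draining nextToken() until null) advances past the wrapped object so later fields still parse. For readers outside the Elasticsearch codebase, the Jackson parser that backs the XContent layer offers the same idea through skipChildren(); the following is a hedged illustration of skipping a sub-object the mapper would reject, not the PR's actual code.

```java
import com.fasterxml.jackson.core.JsonFactory;
import com.fasterxml.jackson.core.JsonParser;
import com.fasterxml.jackson.core.JsonToken;

public class SkipSketch {
    public static void main(String[] args) throws Exception {
        // "oops" is valid JSON but malformed for the histogram mapper.
        String json = "{\"pre_aggregated\": {\"values\": [1.0, \"oops\"], \"counts\": [1, 2]},"
            + " \"otherField\": \"value\"}";
        try (JsonParser parser = new JsonFactory().createParser(json)) {
            parser.nextToken(); // START_OBJECT of the document
            parser.nextToken(); // FIELD_NAME "pre_aggregated"
            parser.nextToken(); // START_OBJECT of the histogram
            // Skip the whole sub-object in one call, leaving the parser
            // positioned at its matching END_OBJECT.
            parser.skipChildren();
            while (parser.nextToken() != null) {
                if (parser.getCurrentToken() == JsonToken.FIELD_NAME) {
                    System.out.println("still parseable: " + parser.getCurrentName());
                }
            }
        }
    }
}
```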

@Override
protected void doXContentBody(XContentBuilder builder, boolean includeDefaults, Params params) throws IOException {
super.doXContentBody(builder, includeDefaults, params);
@@ -40,11 +40,10 @@ private BinaryDocValuesField getDocValue(String fieldName, double[] values) throws IOException {
Iterator<DoubleHistogramIterationValue> iterator = recordedValues.iterator();
while (iterator.hasNext()) {
DoubleHistogramIterationValue value = iterator.next();
-double d = value.getValueIteratedTo();
-streamOutput.writeDouble(d);
long count = value.getCountAtValueIteratedTo();
streamOutput.writeVInt(Math.toIntExact(count));

+double d = value.getValueIteratedTo();
+streamOutput.writeDouble(d);
}
return new BinaryDocValuesField(fieldName, streamOutput.bytes().toBytesRef());
}
@@ -47,9 +47,9 @@ private BinaryDocValuesField getDocValue(String fieldName, double[] values) throws IOException {
DoubleHistogramIterationValue value = iterator.next();
long count = value.getCountAtValueIteratedTo();
if (count != 0) {
+streamOutput.writeVInt(Math.toIntExact(count));
double d = value.getValueIteratedTo();
streamOutput.writeDouble(d);
-streamOutput.writeVInt(Math.toIntExact(count));
}

}
@@ -156,6 +156,48 @@ public void testIgnoreMalformed() throws Exception {
assertThat(doc.rootDoc().getField("pre_aggregated"), nullValue());
}

public void testIgnoreMalformedSkipsKeyword() throws Exception {
ensureGreen();
XContentBuilder xContentBuilder = XContentFactory.jsonBuilder().startObject().startObject("_doc")
.startObject("properties").startObject("pre_aggregated").field("type", "histogram")
.field("ignore_malformed", true)
.endObject().startObject("otherField").field("type", "keyword");
String mapping = Strings.toString(xContentBuilder.endObject().endObject().endObject().endObject());
DocumentMapper defaultMapper = createIndex("test").mapperService().documentMapperParser()
.parse("_doc", new CompressedXContent(mapping));

ParsedDocument doc = defaultMapper.parse(new SourceToParse("test", "1",
BytesReference.bytes(XContentFactory.jsonBuilder()
.startObject().field("pre_aggregated", "value")
.field("otherField","value")
.endObject()),
XContentType.JSON));

assertThat(doc.rootDoc().getField("pre_aggregated"), nullValue());
assertThat(doc.rootDoc().getField("otherField"), notNullValue());
}

public void testIgnoreMalformedSkipsArray() throws Exception {
ensureGreen();
XContentBuilder xContentBuilder = XContentFactory.jsonBuilder().startObject().startObject("_doc")
.startObject("properties").startObject("pre_aggregated").field("type", "histogram")
.field("ignore_malformed", true)
.endObject().startObject("otherField").field("type", "keyword");
String mapping = Strings.toString(xContentBuilder.endObject().endObject().endObject().endObject());
DocumentMapper defaultMapper = createIndex("test").mapperService().documentMapperParser()
.parse("_doc", new CompressedXContent(mapping));

ParsedDocument doc = defaultMapper.parse(new SourceToParse("test", "1",
BytesReference.bytes(XContentFactory.jsonBuilder()
.startObject().field("pre_aggregated", new int[] {2, 2, 2})
.field("otherField","value")
.endObject()),
XContentType.JSON));

assertThat(doc.rootDoc().getField("pre_aggregated"), nullValue());
assertThat(doc.rootDoc().getField("otherField"), notNullValue());
}

public void testIgnoreMalformedSkipsField() throws Exception {
ensureGreen();
XContentBuilder xContentBuilder = XContentFactory.jsonBuilder().startObject().startObject("_doc")
@@ -44,8 +44,8 @@ private BinaryDocValuesField getDocValue(String fieldName, double[] values) throws IOException {
Iterator<Centroid> iterator = centroids.iterator();
while ( iterator.hasNext()) {
Centroid centroid = iterator.next();
-streamOutput.writeDouble(centroid.mean());
streamOutput.writeVInt(centroid.count());
+streamOutput.writeDouble(centroid.mean());
}
return new BinaryDocValuesField(fieldName, streamOutput.bytes().toBytesRef());
}
@@ -47,8 +47,8 @@ private BinaryDocValuesField getDocValue(String fieldName, double[] values) throws IOException {
Iterator<Centroid> iterator = centroids.iterator();
while ( iterator.hasNext()) {
Centroid centroid = iterator.next();
-streamOutput.writeDouble(centroid.mean());
streamOutput.writeVInt(centroid.count());
+streamOutput.writeDouble(centroid.mean());
}
return new BinaryDocValuesField(fieldName, streamOutput.bytes().toBytesRef());
}