influxdata · danielnelson · Mar 2, 2020 · Feb 24, 2020 · Feb 24, 2020 · Feb 24, 2020
diff --git a/plugins/aggregators/histogram/README.md b/plugins/aggregators/histogram/README.md
@@ -3,8 +3,9 @@
 The histogram aggregator plugin creates histograms containing the counts of
 field values within a range.
 
-Values added to a bucket are also added to the larger buckets in the
-distribution.  This creates a [cumulative histogram](https://en.wikipedia.org/wiki/Histogram#/media/File:Cumulative_vs_normal_histogram.svg).
+If `cumulative` is set to true, values added to a bucket are also added to the
+larger buckets in the distribution. This creates a [cumulative histogram](https://en.wikipedia.org/wiki/Histogram#/media/File:Cumulative_vs_normal_histogram.svg).
+Otherwise, values are added to only one bucket, which creates an [ordinary histogram](https://en.wikipedia.org/wiki/Histogram#/media/File:Cumulative_vs_normal_histogram.svg)
 
 Like other Telegraf aggregators, the metric is emitted every `period` seconds.
 By default bucket counts are not reset between periods and will be non-strictly
@@ -16,7 +17,7 @@ increasing while Telegraf is running. This behavior can be changed by setting th
 Each metric is passed to the aggregator and this aggregator searches
 histogram buckets for those fields, which have been specified in the
 config. If buckets are found, the aggregator will increment +1 to the appropriate
-bucket otherwise it will be added to the `+Inf` bucket.  Every `period`
+bucket. Otherwise, it will be added to the `+Inf` bucket.  Every `period`
 seconds this data will be forwarded to the outputs.
 
 The algorithm of hit counting to buckets was implemented on the base
@@ -39,16 +40,20 @@ of the algorithm which is implemented in the Prometheus
   ## of accumulating the results.
   reset = false
 
+  ## Whether bucket values should be accumulated. If set to false, "gt" tag will be added.
+  ## Defaults to true.
+  cumulative = true
+
   ## Example config that aggregates all fields of the metric.
   # [[aggregators.histogram.config]]
-  #   ## The set of buckets.
+  #   ## Right borders of buckets (with +Inf implicitly added).
   #   buckets = [0.0, 15.6, 34.5, 49.1, 71.5, 80.5, 94.5, 100.0]
   #   ## The name of metric.
   #   measurement_name = "cpu"
 
   ## Example config that aggregates only specific fields of the metric.
   # [[aggregators.histogram.config]]
-  #   ## The set of buckets.
+  #   ## Right borders of buckets (with +Inf implicitly added).
   #   buckets = [0.0, 10.0, 20.0, 30.0, 40.0, 50.0, 60.0, 70.0, 80.0, 90.0, 100.0]
   #   ## The name of metric.
   #   measurement_name = "diskio"
@@ -64,8 +69,9 @@ option.  Optionally, if `fields` is set only the fields listed will be
 aggregated.  If `fields` is not set all fields are aggregated.
 
 The `buckets` option contains a list of floats which specify the bucket
-boundaries.  Each float value defines the inclusive upper bound of the bucket.
+boundaries.  Each float value defines the inclusive upper (right) bound of the bucket.
 The `+Inf` bucket is added automatically and does not need to be defined.
+(For left boundaries, these specified bucket borders and `-Inf` will be used).
 
 ### Measurements & Fields:
 
@@ -77,26 +83,43 @@ The postfix `bucket` will be added to each field key.
 
 ### Tags:
 
-All measurements are given the tag `le`. This tag has the border value of
-bucket. It means that the metric value is less than or equal to the value of
-this tag.  For example, let assume that we have the metric value 10 and the
-following buckets: [5, 10, 30, 70, 100]. Then the tag `le` will have the value
-10, because the metrics value is passed into bucket with right border value
-`10`.
+* `cumulative = true` (default):
+  * `le`: Right bucket border. It means that the metric value is less than or
+    equal to the value of this tag. If a metric value is sorted into a bucket,
+    it is also sorted into all larger buckets. As a result, the value of
+    `<field>_bucket` is rising with rising `le` value. When `le` is `+Inf`,
+    the bucket value is the count of all metrics, because all metric values are
+    less than or equal to positive infinity.
+* `cumulative = false`:
+  * `gt`: Left bucket border. It means that the metric value is greater than
+    (and not equal to) the value of this tag.
+  * `le`: Right bucket border. It means that the metric value is less than or
+    equal to the value of this tag.
+  * As both `gt` and `le` are present, each metric is sorted in only exactly
+    one bucket. 
+
 
 ### Example Output:
 
+Let assume we have the buckets [0, 10, 50, 100] and the following field values
+for `usage_idle`: [50, 7, 99, 12]
+
+With `cumulative = true`:
+
+```
+cpu,cpu=cpu1,host=localhost,le=0.0 usage_idle_bucket=0i 1486998330000000000  # none
+cpu,cpu=cpu1,host=localhost,le=10.0 usage_idle_bucket=1i 1486998330000000000  # 7
+cpu,cpu=cpu1,host=localhost,le=50.0 usage_idle_bucket=2i 1486998330000000000  # 7, 12
+cpu,cpu=cpu1,host=localhost,le=100.0 usage_idle_bucket=4i 1486998330000000000  # 7, 12, 50, 99
+cpu,cpu=cpu1,host=localhost,le=+Inf usage_idle_bucket=4i 1486998330000000000  # 7, 12, 50, 99
+```
+
+With `cumulative = false`:
+
 ```
-cpu,cpu=cpu1,host=localhost,le=0.0 usage_idle_bucket=0i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=10.0 usage_idle_bucket=0i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=20.0 usage_idle_bucket=1i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=30.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=40.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=50.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=60.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=70.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=80.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=90.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=100.0 usage_idle_bucket=2i 1486998330000000000
-cpu,cpu=cpu1,host=localhost,le=+Inf usage_idle_bucket=2i 1486998330000000000
+cpu,cpu=cpu1,host=localhost,gt=-Inf,le=0.0 usage_idle_bucket=0i 1486998330000000000  # none
+cpu,cpu=cpu1,host=localhost,gt=0.0,le=10.0 usage_idle_bucket=1i 1486998330000000000  # 7
+cpu,cpu=cpu1,host=localhost,gt=10.0,le=50.0 usage_idle_bucket=1i 1486998330000000000  # 12
+cpu,cpu=cpu1,host=localhost,gt=50.0,le=100.0 usage_idle_bucket=2i 1486998330000000000  # 50, 99
+cpu,cpu=cpu1,host=localhost,gt=100.0,le=+Inf usage_idle_bucket=0i 1486998330000000000  # none
 ```
diff --git a/plugins/aggregators/histogram/histogram.go b/plugins/aggregators/histogram/histogram.go
@@ -8,16 +8,23 @@ import (
 	"github.com/influxdata/telegraf/plugins/aggregators"
 )
 
-// bucketTag is the tag, which contains right bucket border
-const bucketTag = "le"
+// bucketRightTag is the tag, which contains right bucket border
+const bucketRightTag = "le"
 
-// bucketInf is the right bucket border for infinite values
-const bucketInf = "+Inf"
+// bucketPosInf is the right bucket border for infinite values
+const bucketPosInf = "+Inf"
+
+// bucketLeftTag is the tag, which contains left bucket border (exclusive)
+const bucketLeftTag = "gt"
+
+// bucketNegInf is the left bucket border for infinite values
+const bucketNegInf = "-Inf"
 
 // HistogramAggregator is aggregator with histogram configs and particular histograms for defined metrics
 type HistogramAggregator struct {
 	Configs      []config `toml:"config"`
 	ResetBuckets bool     `toml:"reset"`
+	Cumulative   bool     `toml:"cumulative"`
 
 	buckets bucketsByMetrics
 	cache   map[uint64]metricHistogramCollection
@@ -57,8 +64,10 @@ type groupedByCountFields struct {
 }
 
 // NewHistogramAggregator creates new histogram aggregator
-func NewHistogramAggregator() telegraf.Aggregator {
-	h := &HistogramAggregator{}
+func NewHistogramAggregator() *HistogramAggregator {
+	h := &HistogramAggregator{
+		Cumulative: true,
+	}
 	h.buckets = make(bucketsByMetrics)
 	h.resetCache()
 
@@ -77,16 +86,20 @@ var sampleConfig = `
   ## of accumulating the results.
   reset = false
 
+  ## Whether bucket values should be accumulated. If set to false, "gt" tag will be added.
+  ## Defaults to true.
+  cumulative = true
+
   ## Example config that aggregates all fields of the metric.
   # [[aggregators.histogram.config]]
-  #   ## The set of buckets.
+  #   ## Right borders of buckets (with +Inf implicitly added).
   #   buckets = [0.0, 15.6, 34.5, 49.1, 71.5, 80.5, 94.5, 100.0]
   #   ## The name of metric.
   #   measurement_name = "cpu"
 
   ## Example config that aggregates only specific fields of the metric.
   # [[aggregators.histogram.config]]
-  #   ## The set of buckets.
+  #   ## Right borders of buckets (with +Inf implicitly added).
   #   buckets = [0.0, 10.0, 20.0, 30.0, 40.0, 50.0, 60.0, 70.0, 80.0, 90.0, 100.0]
   #   ## The name of metric.
   #   measurement_name = "diskio"
@@ -167,18 +180,35 @@ func (h *HistogramAggregator) groupFieldsByBuckets(
 	tags map[string]string,
 	counts []int64,
 ) {
-	count := int64(0)
-	for index, bucket := range h.getBuckets(name, field) {
-		count += counts[index]
+	if h.Cumulative {
+		count := int64(0)
+		for index, bucket := range h.getBuckets(name, field) {
+			count += counts[index]
 
-		tags[bucketTag] = strconv.FormatFloat(bucket, 'f', -1, 64)
-		h.groupField(metricsWithGroupedFields, name, field, count, copyTags(tags))
-	}
+			tags[bucketRightTag] = strconv.FormatFloat(bucket, 'f', -1, 64)
+			h.groupField(metricsWithGroupedFields, name, field, count, copyTags(tags))
+		}
 
-	count += counts[len(counts)-1]
-	tags[bucketTag] = bucketInf
+		count += counts[len(counts)-1]
+		tags[bucketRightTag] = bucketPosInf
 
-	h.groupField(metricsWithGroupedFields, name, field, count, tags)
+		h.groupField(metricsWithGroupedFields, name, field, count, tags)
+	} else {
+		buckets := h.getBuckets(name, field)
+		for index, count := range counts {
+			tags[bucketLeftTag] = bucketNegInf
+			if index > 0 {
+				tags[bucketLeftTag] = strconv.FormatFloat(buckets[index-1], 'f', -1, 64)
+			}
+
+			tags[bucketRightTag] = bucketPosInf
+			if index < len(buckets) {
+				tags[bucketRightTag] = strconv.FormatFloat(buckets[index], 'f', -1, 64)
+			}
+
+			h.groupField(metricsWithGroupedFields, name, field, count, copyTags(tags))
+		}
+	}
 }
 
 // groupField groups field by count value