Skip to content

Commit

Permalink
Multiple duration fields for better Elasticsearch storage for controll…
Browse files Browse the repository at this point in the history
…ermanager (#32486)

* Multiple duration fields for better Elasticsearch storage

* Update controllermanager dashboard
  • Loading branch information
MichaelKatsoulis authored Jul 26, 2022
1 parent c580fdb commit 284d2d9
Show file tree
Hide file tree
Showing 9 changed files with 5,235 additions and 7,242 deletions.
35 changes: 4 additions & 31 deletions metricbeat/docs/fields.asciidoc
Original file line number Diff line number Diff line change
Expand Up @@ -43502,7 +43502,7 @@ type: long

--

*`kubernetes.controllermanager.client.request.duration.sec.bucket.*`*::
*`kubernetes.controllermanager.client.request.duration.us.bucket.*`*::
+
--
Response latency distribution, histogram buckets
Expand All @@ -43511,16 +43511,16 @@ type: object

--

*`kubernetes.controllermanager.client.request.duration.sec.sum`*::
*`kubernetes.controllermanager.client.request.duration.us.sum`*::
+
--
Request duration, sum in seconds
Request duration, sum in microseconds

type: long

--

*`kubernetes.controllermanager.client.request.duration.sec.count`*::
*`kubernetes.controllermanager.client.request.duration.us.count`*::
+
--
Request duration, number of operations
Expand Down Expand Up @@ -43575,33 +43575,6 @@ type: long

--

*`kubernetes.controllermanager.workqueue.work.duration.sec.sum`*::
+
--
Processing time of workqueue item, sum in seconds

type: long

--

*`kubernetes.controllermanager.workqueue.work.duration.sec.count`*::
+
--
Processing time of workqueue item, number of operations

type: long

--

*`kubernetes.controllermanager.workqueue.work.duration.sec.bucket.*`*::
+
--
Processing time of workqueue item, histogram buckets

type: object

--


*`kubernetes.controllermanager.node.collector.eviction.count`*::
+
Expand Down

Large diffs are not rendered by default.

Original file line number Diff line number Diff line change
@@ -0,0 +1,190 @@
{
"attributes": {
"description": "",
"kibanaSavedObjectMeta": {
"searchSourceJSON": {
"filter": [],
"query": {
"language": "kuery",
"query": ""
}
}
},
"title": "Controller Process [Metricbeat Kubernetes]",
"uiStateJSON": {},
"version": 1,
"visState": {
"aggs": [],
"params": {
"axis_formatter": "number",
"axis_position": "left",
"axis_scale": "normal",
"drop_last_bucket": 1,
"hide_last_value_indicator": true,
"id": "61ca57f0-469d-11e7-af02-69e470af7417",
"index_pattern": "metricbeat-*",
"interval": "30s",
"isModelInvalid": false,
"markdown": "| | |\n|---|---|\n|**Days running**|{{ math.started.last.raw }}|\n|**File descriptors open**|{{ average_of_kubernetes_controllermanager_process_fds_open_count.fds.last.formatted }}|\n|**Maximum File descriptors**|{{ max_of_kubernetes_controllermanager_process_fds_max_count.fds_max.last.formatted }}|\n|**Resident Memory**|{{ average_of_kubernetes_controllermanager_process_memory_resident_bytes.resident_memory.last.formatted }}|\n|**Virtual Memory**|{{ average_of_kubernetes_controllermanager_process_memory_virtual_bytes.virtual_memory.last.formatted }}|\n",
"markdown_css": "table, tr, td, th{border:none}",
"max_lines_legend": 1,
"series": [
{
"axis_position": "right",
"chart_type": "line",
"color": "#68BC00",
"fill": 0.5,
"formatter": "number",
"id": "61ca57f1-469d-11e7-af02-69e470af7417",
"line_width": 1,
"metrics": [
{
"field": "kubernetes.controllermanager.process.started.sec",
"id": "61ca57f2-469d-11e7-af02-69e470af7417",
"type": "max"
},
{
"id": "ebfdb1c0-9c1c-11e9-b29f-d55be9348723",
"script": "round( (params._timestamp /1000 - params.started) / 86400, 2)",
"type": "math",
"variables": [
{
"field": "61ca57f2-469d-11e7-af02-69e470af7417",
"id": "ef30a230-9c1c-11e9-b29f-d55be9348723",
"name": "started"
}
]
}
],
"point_size": 1,
"separate_axis": 0,
"split_color_mode": "gradient",
"split_mode": "everything",
"stacked": "none",
"time_range_mode": "entire_time_range",
"var_name": "started"
},
{
"axis_position": "right",
"chart_type": "line",
"color": "#68BC00",
"fill": 0.5,
"formatter": "number",
"id": "1212ba80-9c1e-11e9-b29f-d55be9348723",
"label": "",
"line_width": 1,
"metrics": [
{
"field": "kubernetes.controllermanager.process.fds.open.count",
"id": "1212ba81-9c1e-11e9-b29f-d55be9348723",
"type": "avg"
}
],
"point_size": 1,
"separate_axis": 0,
"split_color_mode": "gradient",
"split_mode": "everything",
"stacked": "none",
"time_range_mode": "entire_time_range",
"var_name": "fds"
},
{
"axis_position": "right",
"chart_type": "line",
"color": "#68BC00",
"fill": 0.5,
"formatter": "bytes",
"id": "3f3b17a0-9c1e-11e9-b29f-d55be9348723",
"label": "",
"line_width": 1,
"metrics": [
{
"field": "kubernetes.controllermanager.process.memory.resident.bytes",
"id": "3f3b17a1-9c1e-11e9-b29f-d55be9348723",
"type": "avg"
}
],
"point_size": 1,
"separate_axis": 0,
"split_color_mode": "gradient",
"split_mode": "everything",
"stacked": "none",
"time_range_mode": "entire_time_range",
"var_name": "resident_memory"
},
{
"axis_position": "right",
"chart_type": "line",
"color": "#68BC00",
"fill": 0.5,
"formatter": "bytes",
"id": "b1a01b50-9c1f-11e9-b29f-d55be9348723",
"line_width": 1,
"metrics": [
{
"field": "kubernetes.controllermanager.process.memory.virtual.bytes",
"id": "b1a01b51-9c1f-11e9-b29f-d55be9348723",
"type": "avg"
}
],
"point_size": 1,
"separate_axis": 0,
"split_color_mode": "gradient",
"split_mode": "everything",
"stacked": "none",
"time_range_mode": "entire_time_range",
"var_name": "virtual_memory"
},
{
"axis_position": "right",
"chart_type": "line",
"color": "#68BC00",
"fill": 0.5,
"formatter": "number",
"id": "6faac700-f2dd-11ec-ab74-4342b85d7779",
"label": "",
"line_width": 1,
"metrics": [
{
"field": "kubernetes.controllermanager.process.fds.max.count",
"id": "6faaee10-f2dd-11ec-ab74-4342b85d7779",
"type": "max"
}
],
"override_index_pattern": 0,
"palette": {
"name": "default",
"type": "palette"
},
"point_size": 1,
"separate_axis": 0,
"series_drop_last_bucket": 0,
"split_mode": "everything",
"stacked": "none",
"time_range_mode": "entire_time_range",
"var_name": "fds_max"
}
],
"show_grid": 1,
"show_legend": 1,
"time_field": "@timestamp",
"time_range_mode": "last_value",
"tooltip_mode": "show_all",
"truncate_legend": 1,
"type": "markdown",
"use_kibana_indexes": false
},
"title": "Controller Process [Metricbeat Kubernetes]",
"type": "metrics"
}
},
"coreMigrationVersion": "8.4.0",
"id": "2d866300-0cb1-11ed-b5e5-a774dc3eeaba",
"migrationVersion": {
"visualization": "8.3.0"
},
"references": [],
"type": "visualization",
"updated_at": "2022-07-26T07:04:23.093Z",
"version": "WzEzNzksMV0="
}
41 changes: 17 additions & 24 deletions metricbeat/module/kubernetes/controllermanager/_meta/data.json
Original file line number Diff line number Diff line change
Expand Up @@ -7,31 +7,24 @@
},
"kubernetes": {
"controllermanager": {
"client": {
"request": {
"duration": {
"sec": {
"bucket": {
"+Inf": 1,
"0.001": 0,
"0.002": 0,
"0.004": 0,
"0.008": 0,
"0.016": 1,
"0.032": 1,
"0.064": 1,
"0.128": 1,
"0.256": 1,
"0.512": 1
},
"count": 1,
"sum": 0.008447322
}
}
"name": "serviceaccount",
"workqueue": {
"adds": {
"count": 5
},
"depth": {
"count": 0
},
"longestrunning": {
"sec": 0
},
"retries": {
"count": 0
},
"unfinished": {
"sec": 0
}
},
"url": "https://172.18.0.2:6443/api/v1/configmaps?limit=%7Bvalue%7D\u0026resourceVersion=%7Bvalue%7D",
"verb": "GET"
}
}
},
"metricset": {
Expand Down
18 changes: 4 additions & 14 deletions metricbeat/module/kubernetes/controllermanager/_meta/fields.yml
Original file line number Diff line number Diff line change
Expand Up @@ -62,14 +62,14 @@
type: long
description: >
Number of requests as client
- name: request.duration.sec.bucket.*
- name: request.duration.us.bucket.*
type: object
object_type: long
description: Response latency distribution, histogram buckets
- name: request.duration.sec.sum
- name: request.duration.us.sum
type: long
description: Request duration, sum in seconds
- name: request.duration.sec.count
description: Request duration, sum in microseconds
- name: request.duration.us.count
type: long
description: Request duration, number of operations
- name: workqueue
Expand All @@ -90,16 +90,6 @@
- name: retries.count
type: long
description: Workqueue number of retries
- name: work.duration.sec.sum
type: long
description: Processing time of workqueue item, sum in seconds
- name: work.duration.sec.count
type: long
description: Processing time of workqueue item, number of operations
- name: work.duration.sec.bucket.*
type: object
object_type: long
description: Processing time of workqueue item, histogram buckets
- name: node.collector
type: group
fields:
Expand Down
Loading

0 comments on commit 284d2d9

Please sign in to comment.