Skip to content

Commit e942112

Browse files
committed
Update Telemeter metrics allow-list
Signed-off-by: Simon Pasquier <[email protected]>
1 parent 62555bd commit e942112

File tree

3 files changed

+42
-7
lines changed

3 files changed

+42
-7
lines changed

Diff for: Makefile

+3-1
Original file line number | Diff line number | Diff line change
@@ -107,7 +107,9 @@ resources/observability/grafana/observatorium-logs: format observability/grafana
107107
$(JSONNET) -J "$(JSONNET_VENDOR_DIR)" -m resources/observability/grafana/observatorium-logs observability/grafana-obs-logs.jsonnet | $(XARGS) -I{} sh -c 'cat {} | $(GOJSONTOYAML) > {}.yaml' -- {}
108108

109109
.PHONY: whitelisted_metrics
110-
whitelisted_metrics: $(GOJSONTOYAML) $(GOJQ)
110+
whitelisted_metrics: $(GOJSONTOYAML) $(GOJQ) configuration/telemeter/metrics.json resources/services/telemeter-template.yaml
111+
112+
configuration/telemeter/metrics.json:
111113
@echo ">>>>> Running whitelisted_metrics"
112114
# Download the latest metrics file to extract the new added metrics.
113115
# NOTE: Because old clusters could still send metrics the whitelisting is append only

Diff for: configuration/telemeter/metrics.json

+13-2
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,6 @@
11
[
22
"{__name__=\":apiserver_v1_image_imports:sum\"}",
3+
"{__name__=\"ALERTS\",alertstate=\"firing\",severity=~\"critical|warning|info|none\"}",
34
"{__name__=\"ALERTS\",alertstate=\"firing\"}",
45
"{__name__=\"acm_console_page_count:sum\", page=~\"overview-classic|overview-fleet|search|search-details|clusters|application|governance\"}",
56
"{__name__=\"acm_managed_cluster_info\"}",
@@ -73,6 +74,8 @@
7374
"{__name__=\"cluster_installer\"}",
7475
"{__name__=\"cluster_legacy_scheduler_policy\"}",
7576
"{__name__=\"cluster_master_schedulable\"}",
77+
"{__name__=\"cluster_name:hypershift_nodepools_available_replicas:sum\"}",
78+
"{__name__=\"cluster_name:hypershift_nodepools_size:sum\"}",
7679
"{__name__=\"cluster_operator_conditions\"}",
7780
"{__name__=\"cluster_operator_up\"}",
7881
"{__name__=\"cluster_version\"}",
@@ -88,6 +91,7 @@
8891
"{__name__=\"count:up1\"}",
8992
"{__name__=\"csv_abnormal\"}",
9093
"{__name__=\"csv_succeeded\"}",
94+
"{__name__=\"enabled:tempo_operator_tempostack_jaeger_ui:sum\",enabled=~\"true|false\"}",
9195
"{__name__=\"eo_es_cluster_management_state_info\"}",
9296
"{__name__=\"eo_es_defined_delete_namespaces_total\"}",
9397
"{__name__=\"eo_es_misconfigured_memory_resources_info\"}",
@@ -164,8 +168,6 @@
164168
"{__name__=\"os_image_url_override:sum\"}",
165169
"{__name__=\"platform:hypershift_hostedclusters:max\"}",
166170
"{__name__=\"platform:hypershift_nodepools:max\"}",
167-
"{__name__=\"cluster_name:hypershift_nodepools_size:sum\"}",
168-
"{__name__=\"cluster_name:hypershift_nodepools_available_replicas:sum\"}",
169171
"{__name__=\"pod:eo_es_shards_total:max\"}",
170172
"{__name__=\"profile:cluster_monitoring_operator_collection_profile:max\"}",
171173
"{__name__=\"rhacs:telemetry:rox_central_info\"}",
@@ -180,8 +182,17 @@
180182
"{__name__=\"rhods_total_users\"}",
181183
"{__name__=\"state:rhoam_critical_alerts:max\"}",
182184
"{__name__=\"state:rhoam_warning_alerts:max\"}",
185+
"{__name__=\"state:tempo_operator_tempostack_managed:sum\",state=~\"Managed|Unmanaged\"}",
183186
"{__name__=\"status:upgrading:version:rhoam_state:max\"}",
184187
"{__name__=\"subscription_sync_total\"}",
188+
"{__name__=\"type:opentelemetry_collector_connectors:sum\",type=~\"spanmetricsconnector|forwardconnector\"}",
189+
"{__name__=\"type:opentelemetry_collector_exporters:sum\",type=~\"debugexporter|loggingexporter|otlpexporter|otlphttpexporter|prometheusexporter|lokiexporter|kafkaexporter|awscloudwatchlogsexporter|loadbalancingexporter\"}",
190+
"{__name__=\"type:opentelemetry_collector_extensions:sum\",type=~\"zpagesextension|ballastextension|memorylimiterextension|jaegerremotesampling|healthcheckextension|pprofextension|oauth2clientauthextension|oidcauthextension|bearertokenauthextension|filestorage\"}",
191+
"{__name__=\"type:opentelemetry_collector_info:sum\",type=~\"deployment|daemonset|sidecar|statefulset\"}",
192+
"{__name__=\"type:opentelemetry_collector_processors:sum\",type=~\"batchprocessor|memorylimiterprocessor|attributesprocessor|resourceprocessor|spanprocessor|k8sattributesprocessor|resourcedetectionprocessor|filterprocessor|routingprocessor|cumulativetodeltaprocessor|groupbyattrsprocessor\"}",
193+
"{__name__=\"type:opentelemetry_collector_receivers:sum\",type=~\"jaegerreceiver|hostmetricsreceiver|opencensusreceiver|prometheusreceiver|zipkinreceiver|kafkareceiver|filelogreceiver|journaldreceiver|k8seventsreceiver|kubeletstatsreceiver|k8sclusterreceiver|k8sobjectsreceiver\"}",
194+
"{__name__=\"type:tempo_operator_tempostack_multi_tenancy:sum\",type=~\"enabled|disabled\"}",
195+
"{__name__=\"type:tempo_operator_tempostack_storage_backend:sum\",type=~\"azure|gcs|s3\"}",
185196
"{__name__=\"up\"}",
186197
"{__name__=\"visual_web_terminal_sessions_total\"}",
187198
"{__name__=\"workload:cpu_usage_cores:sum\"}",

Diff for: resources/services/telemeter-template.yaml

+26-4
Original file line number | Diff line number | Diff line change
@@ -94,6 +94,7 @@ objects:
9494
- --memcached=memcached-1.memcached.${NAMESPACE}.svc.cluster.local:11211
9595
- --memcached=memcached-2.memcached.${NAMESPACE}.svc.cluster.local:11211
9696
- --whitelist={__name__=":apiserver_v1_image_imports:sum"}
97+
- --whitelist={__name__="ALERTS",alertstate="firing",severity=~"critical|warning|info|none"}
9798
- --whitelist={__name__="ALERTS",alertstate="firing"}
9899
- --whitelist={__name__="acm_console_page_count:sum", page=~"overview-classic|overview-fleet|search|search-details|clusters|application|governance"}
99100
- --whitelist={__name__="acm_managed_cluster_info"}
@@ -167,6 +168,8 @@ objects:
167168
- --whitelist={__name__="cluster_installer"}
168169
- --whitelist={__name__="cluster_legacy_scheduler_policy"}
169170
- --whitelist={__name__="cluster_master_schedulable"}
171+
- --whitelist={__name__="cluster_name:hypershift_nodepools_available_replicas:sum"}
172+
- --whitelist={__name__="cluster_name:hypershift_nodepools_size:sum"}
170173
- --whitelist={__name__="cluster_operator_conditions"}
171174
- --whitelist={__name__="cluster_operator_up"}
172175
- --whitelist={__name__="cluster_version"}
@@ -182,6 +185,7 @@ objects:
182185
- --whitelist={__name__="count:up1"}
183186
- --whitelist={__name__="csv_abnormal"}
184187
- --whitelist={__name__="csv_succeeded"}
188+
- --whitelist={__name__="enabled:tempo_operator_tempostack_jaeger_ui:sum",enabled=~"true|false"}
185189
- --whitelist={__name__="eo_es_cluster_management_state_info"}
186190
- --whitelist={__name__="eo_es_defined_delete_namespaces_total"}
187191
- --whitelist={__name__="eo_es_misconfigured_memory_resources_info"}
@@ -258,8 +262,6 @@ objects:
258262
- --whitelist={__name__="os_image_url_override:sum"}
259263
- --whitelist={__name__="platform:hypershift_hostedclusters:max"}
260264
- --whitelist={__name__="platform:hypershift_nodepools:max"}
261-
- --whitelist={__name__="cluster_name:hypershift_nodepools_size:sum"}
262-
- --whitelist={__name__="cluster_name:hypershift_nodepools_available_replicas:sum"}
263265
- --whitelist={__name__="pod:eo_es_shards_total:max"}
264266
- --whitelist={__name__="profile:cluster_monitoring_operator_collection_profile:max"}
265267
- --whitelist={__name__="rhacs:telemetry:rox_central_info"}
@@ -274,8 +276,17 @@ objects:
274276
- --whitelist={__name__="rhods_total_users"}
275277
- --whitelist={__name__="state:rhoam_critical_alerts:max"}
276278
- --whitelist={__name__="state:rhoam_warning_alerts:max"}
279+
- --whitelist={__name__="state:tempo_operator_tempostack_managed:sum",state=~"Managed|Unmanaged"}
277280
- --whitelist={__name__="status:upgrading:version:rhoam_state:max"}
278281
- --whitelist={__name__="subscription_sync_total"}
282+
- --whitelist={__name__="type:opentelemetry_collector_connectors:sum",type=~"spanmetricsconnector|forwardconnector"}
283+
- --whitelist={__name__="type:opentelemetry_collector_exporters:sum",type=~"debugexporter|loggingexporter|otlpexporter|otlphttpexporter|prometheusexporter|lokiexporter|kafkaexporter|awscloudwatchlogsexporter|loadbalancingexporter"}
284+
- --whitelist={__name__="type:opentelemetry_collector_extensions:sum",type=~"zpagesextension|ballastextension|memorylimiterextension|jaegerremotesampling|healthcheckextension|pprofextension|oauth2clientauthextension|oidcauthextension|bearertokenauthextension|filestorage"}
285+
- --whitelist={__name__="type:opentelemetry_collector_info:sum",type=~"deployment|daemonset|sidecar|statefulset"}
286+
- --whitelist={__name__="type:opentelemetry_collector_processors:sum",type=~"batchprocessor|memorylimiterprocessor|attributesprocessor|resourceprocessor|spanprocessor|k8sattributesprocessor|resourcedetectionprocessor|filterprocessor|routingprocessor|cumulativetodeltaprocessor|groupbyattrsprocessor"}
287+
- --whitelist={__name__="type:opentelemetry_collector_receivers:sum",type=~"jaegerreceiver|hostmetricsreceiver|opencensusreceiver|prometheusreceiver|zipkinreceiver|kafkareceiver|filelogreceiver|journaldreceiver|k8seventsreceiver|kubeletstatsreceiver|k8sclusterreceiver|k8sobjectsreceiver"}
288+
- --whitelist={__name__="type:tempo_operator_tempostack_multi_tenancy:sum",type=~"enabled|disabled"}
289+
- --whitelist={__name__="type:tempo_operator_tempostack_storage_backend:sum",type=~"azure|gcs|s3"}
279290
- --whitelist={__name__="up"}
280291
- --whitelist={__name__="visual_web_terminal_sessions_total"}
281292
- --whitelist={__name__="workload:cpu_usage_cores:sum"}
@@ -379,6 +390,7 @@ objects:
379390
- --memcached=memcached-1.memcached.${NAMESPACE}.svc.cluster.local:11211
380391
- --memcached=memcached-2.memcached.${NAMESPACE}.svc.cluster.local:11211
381392
- --whitelist={__name__=":apiserver_v1_image_imports:sum"}
393+
- --whitelist={__name__="ALERTS",alertstate="firing",severity=~"critical|warning|info|none"}
382394
- --whitelist={__name__="ALERTS",alertstate="firing"}
383395
- --whitelist={__name__="acm_console_page_count:sum", page=~"overview-classic|overview-fleet|search|search-details|clusters|application|governance"}
384396
- --whitelist={__name__="acm_managed_cluster_info"}
@@ -452,6 +464,8 @@ objects:
452464
- --whitelist={__name__="cluster_installer"}
453465
- --whitelist={__name__="cluster_legacy_scheduler_policy"}
454466
- --whitelist={__name__="cluster_master_schedulable"}
467+
- --whitelist={__name__="cluster_name:hypershift_nodepools_available_replicas:sum"}
468+
- --whitelist={__name__="cluster_name:hypershift_nodepools_size:sum"}
455469
- --whitelist={__name__="cluster_operator_conditions"}
456470
- --whitelist={__name__="cluster_operator_up"}
457471
- --whitelist={__name__="cluster_version"}
@@ -467,6 +481,7 @@ objects:
467481
- --whitelist={__name__="count:up1"}
468482
- --whitelist={__name__="csv_abnormal"}
469483
- --whitelist={__name__="csv_succeeded"}
484+
- --whitelist={__name__="enabled:tempo_operator_tempostack_jaeger_ui:sum",enabled=~"true|false"}
470485
- --whitelist={__name__="eo_es_cluster_management_state_info"}
471486
- --whitelist={__name__="eo_es_defined_delete_namespaces_total"}
472487
- --whitelist={__name__="eo_es_misconfigured_memory_resources_info"}
@@ -543,8 +558,6 @@ objects:
543558
- --whitelist={__name__="os_image_url_override:sum"}
544559
- --whitelist={__name__="platform:hypershift_hostedclusters:max"}
545560
- --whitelist={__name__="platform:hypershift_nodepools:max"}
546-
- --whitelist={__name__="cluster_name:hypershift_nodepools_size:sum"}
547-
- --whitelist={__name__="cluster_name:hypershift_nodepools_available_replicas:sum"}
548561
- --whitelist={__name__="pod:eo_es_shards_total:max"}
549562
- --whitelist={__name__="profile:cluster_monitoring_operator_collection_profile:max"}
550563
- --whitelist={__name__="rhacs:telemetry:rox_central_info"}
@@ -559,8 +572,17 @@ objects:
559572
- --whitelist={__name__="rhods_total_users"}
560573
- --whitelist={__name__="state:rhoam_critical_alerts:max"}
561574
- --whitelist={__name__="state:rhoam_warning_alerts:max"}
575+
- --whitelist={__name__="state:tempo_operator_tempostack_managed:sum",state=~"Managed|Unmanaged"}
562576
- --whitelist={__name__="status:upgrading:version:rhoam_state:max"}
563577
- --whitelist={__name__="subscription_sync_total"}
578+
- --whitelist={__name__="type:opentelemetry_collector_connectors:sum",type=~"spanmetricsconnector|forwardconnector"}
579+
- --whitelist={__name__="type:opentelemetry_collector_exporters:sum",type=~"debugexporter|loggingexporter|otlpexporter|otlphttpexporter|prometheusexporter|lokiexporter|kafkaexporter|awscloudwatchlogsexporter|loadbalancingexporter"}
580+
- --whitelist={__name__="type:opentelemetry_collector_extensions:sum",type=~"zpagesextension|ballastextension|memorylimiterextension|jaegerremotesampling|healthcheckextension|pprofextension|oauth2clientauthextension|oidcauthextension|bearertokenauthextension|filestorage"}
581+
- --whitelist={__name__="type:opentelemetry_collector_info:sum",type=~"deployment|daemonset|sidecar|statefulset"}
582+
- --whitelist={__name__="type:opentelemetry_collector_processors:sum",type=~"batchprocessor|memorylimiterprocessor|attributesprocessor|resourceprocessor|spanprocessor|k8sattributesprocessor|resourcedetectionprocessor|filterprocessor|routingprocessor|cumulativetodeltaprocessor|groupbyattrsprocessor"}
583+
- --whitelist={__name__="type:opentelemetry_collector_receivers:sum",type=~"jaegerreceiver|hostmetricsreceiver|opencensusreceiver|prometheusreceiver|zipkinreceiver|kafkareceiver|filelogreceiver|journaldreceiver|k8seventsreceiver|kubeletstatsreceiver|k8sclusterreceiver|k8sobjectsreceiver"}
584+
- --whitelist={__name__="type:tempo_operator_tempostack_multi_tenancy:sum",type=~"enabled|disabled"}
585+
- --whitelist={__name__="type:tempo_operator_tempostack_storage_backend:sum",type=~"azure|gcs|s3"}
564586
- --whitelist={__name__="up"}
565587
- --whitelist={__name__="visual_web_terminal_sessions_total"}
566588
- --whitelist={__name__="workload:cpu_usage_cores:sum"}

0 commit comments

Comments
 (0)