diff --git a/confluent_platform/changelog.d/17490.fixed b/confluent_platform/changelog.d/17490.fixed
new file mode 100644
index 0000000000000..d6b30db29af0a
--- /dev/null
+++ b/confluent_platform/changelog.d/17490.fixed
@@ -0,0 +1,2 @@
+
+Add a bean regex for stream thread metrics for Confluent Platform versions >=5.5.0. Previously, stream thread metrics were not collected. Also add one attribute that is useful for debugging stream thread performance.
diff --git a/confluent_platform/datadog_checks/confluent_platform/data/metrics.yaml b/confluent_platform/datadog_checks/confluent_platform/data/metrics.yaml
index 8c5bcc4eab4ec..7133eb3fe3ed4 100644
--- a/confluent_platform/datadog_checks/confluent_platform/data/metrics.yaml
+++ b/confluent_platform/datadog_checks/confluent_platform/data/metrics.yaml
@@ -1600,7 +1600,108 @@ jmx_metrics:
 
 
   # Components Metrics:
-  # - Confluent Streams Thread: https://docs.confluent.io/current/streams/monitoring.html#built-in-metrics
+  # - Confluent Streams Thread: https://docs.confluent.io/current/streams/monitoring.html#thread-metrics
+  # Applies to Confluent Platform >=5.5.0, where stream thread beans are matched by type=stream-thread-metrics and thread-id.
+  - include:
+      domain: kafka.streams
+      bean_regex: kafka\.streams:type=stream-thread-metrics,thread-id=.*
+      attribute:
+        blocked-time-ns-total:
+          # The total time the Kafka Streams thread spent blocked on Kafka since it was started, in nanoseconds (ns).
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        commit-latency-avg:
+          # The average value of commit-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        commit-latency-max:
+          # The maximum value of commit-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        commit-rate:
+          # The average per-second number of commit calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        commit-total:
+          # The total number of commit calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        poll-latency-avg:
+          # The average value of poll-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        poll-latency-max:
+          # The maximum value of poll-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        poll-rate:
+          # The average per-second number of poll calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        poll-total:
+          # The total number of poll calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        process-latency-avg:
+          # The average value of process-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        process-latency-max:
+          # The maximum value of process-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        process-rate:
+          # The average per-second number of process calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        process-total:
+          # The total number of process calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        punctuate-latency-avg:
+          # The average value of punctuate-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        punctuate-latency-max:
+          # The maximum value of punctuate-latency.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        punctuate-rate:
+          # The average per-second number of punctuate calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        punctuate-total:
+          # The total number of punctuate calls.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        skipped-records-rate:
+          # The average per-second number of skipped records.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        skipped-records-total:
+          # The total number of skipped records.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        task-closed-rate:
+          # The average per-second number of closed tasks.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        task-closed-total:
+          # The total number of closed tasks.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        task-created-rate:
+          # The average per-second number of newly created tasks.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+        task-created-total:
+          # The total number of newly created tasks.
+          alias: confluent.$domain.stream.$attribute
+          metric_type: gauge
+
+  # Components Metrics:
+  # - Confluent Streams Thread: https://docs.confluent.io/legacy/platform/5.4.10/streams/monitoring.html#built-in-metrics
+  # Kept for backwards compatibility with at least version 5.4.10 of Confluent Platform.
   - include:
       domain: kafka.streams
       bean_regex: kafka\.streams:type=stream-metrics,client-id=.*