aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorStaffan Olsson <staffan@repos.se>2018-02-02 12:33:27 +0100
committerStaffan Olsson <staffan@repos.se>2018-02-03 14:25:33 +0100
commit152bb19a7cdd448941e07c3a7c23e5a16f9c6b56 (patch)
tree61b3f047c2925f62f0c30ac28661608e0bc97ccc
parentcfe434c55bc44d53ff6a569fa480ef4d92bd1144 (diff)
downloadkubernetes-kafka-152bb19a7cdd448941e07c3a7c23e5a16f9c6b56.tar.gz
kubernetes-kafka-152bb19a7cdd448941e07c3a7c23e5a16f9c6b56.tar.bz2
kubernetes-kafka-152bb19a7cdd448941e07c3a7c23e5a16f9c6b56.zip
“In a production Kafka cluster, an offline partition
may be impacting the producer clients, losing messages or causing back-pressure in the application. This is most often a ‘site down’ type of problem and will need to be addressed immediately.” Excerpt from: Neha Narkhede, Gwen Shapira, and Todd Palino. “Kafka: The Definitive Guide”. We now export kafka_controller_kafkacontroller_value{name="OfflinePartitionsCount",} and friends. See #140 for why.
-rw-r--r--prometheus/10-metrics-config.yml3
1 files changed, 2 insertions, 1 deletions
diff --git a/prometheus/10-metrics-config.yml b/prometheus/10-metrics-config.yml
index 4416cce..33bed50 100644
--- a/prometheus/10-metrics-config.yml
+++ b/prometheus/10-metrics-config.yml
@@ -9,8 +9,9 @@ data:
lowercaseOutputName: true
jmxUrl: service:jmx:rmi:///jndi/rmi://127.0.0.1:5555/jmxrmi
ssl: false
- whitelistObjectNames: ["kafka.server:*","java.lang:*"]
+ whitelistObjectNames: ["kafka.controller:*","kafka.server:*","java.lang:*"]
rules:
+ - pattern : kafka.controller<type=KafkaController, name=(.+)><>(.*)
- pattern : kafka.server<type=ReplicaFetcherManager, name=MaxLag, clientId=(.+)><>Value
- pattern : kafka.server<type=BrokerTopicMetrics, name=(BytesInPerSec|BytesOutPerSec|MessagesInPerSec), topic=(.+)><>OneMinuteRate
- pattern : kafka.server<type=KafkaRequestHandlerPool, name=RequestHandlerAvgIdlePercent><>OneMinuteRate