diff --git a/README.md b/README.md index 68bb4e4..215ea82 100644 --- a/README.md +++ b/README.md @@ -4,7 +4,30 @@ Configurable general purpose Prometheus exporter for MQTT. Subscribes to one or more MQTT topics, and lets you configure prometheus metrics based on pattern matching. -[![Test with pytest](https://github.com/fhemberger/mqtt_exporter/actions/workflows/test.yml/badge.svg)](https://github.com/fhemberger/mqtt_exporter/actions/workflows/test.yml)[![CodeQL](https://github.com/fhemberger/mqtt_exporter/actions/workflows/codeql-analysis.yml/badge.svg)](https://github.com/fhemberger/mqtt_exporter/actions/workflows/codeql-analysis.yml) +[![Test with pytest](https://github.com/fhemberger/mqtt_exporter/actions/workflows/test.yml/badge.svg)](https://github.com/fhemberger/mqtt_exporter/actions/workflows/test.yml)[![CodeQL](https://github.com/fhemberger/mqtt_exporter/actions/workflows/codeql-analysis.yml/badge.svg)](https://github.com/fhemberger/mqtt_exporter/actions/workflows/codeql-analysis.yml)![Docker Pulls](https://img.shields.io/docker/pulls/fhemberger/mqtt_exporter) + + +## Features + +- Supported Metrics: + - standard metrics + - Gauge, Counter, Histogram, Summary + - additional + - **Counter (Absolute):** + - Same as Counter, but working with absolute numbers received from MQTT. Which is far more common, than sending the diff in each publish. + - e.g. a network counter or a rain sensor + - **Enum:** + - is a metric type not so common, details can be found in the [OpenMetrics docs](https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#stateset) and [Python client code](https://github.com/prometheus/client_python/blob/9a24236695c9ad47f9dc537a922a6d1333d8d093/prometheus_client/metrics.py#L640-L698). + - Allows to track as state by a know set of strings describing the state, e.g. `on/off` or `high/medium/low` + - Common sources would be a light switch oder a door lock. +- Comprehensive rewriting for topic, value/payload and labels + - similar to prometheus label rewrites + - regex allows almost every conversion + - e.g. to + - remove units or other strings from payload + - convert topic hierarchy into labels + - normalize labels + - check example configs `./exampleconf` and the configs in `./test/test_data/` ## Usage @@ -43,9 +66,16 @@ docker run -d \ - PyYAML - yamlreader -Functional tests are written in `pytest` (see [tests/readme.md](tests/readme.md)), code formatting uses [`autopep8`](https://pypi.org/project/autopep8/) with default settings. If you submit a PR to this repo, please make sure it follows its formatting guidelines. + +## Contribution + +* Contribution is welcome. Fork and then PR. +* Discussions in Issues. +* Functional tests are written in `pytest` (see [tests/readme.md](tests/readme.md)) +* Code formatting uses [`autopep8`](https://pypi.org/project/autopep8/) with default settings. If you submit a PR to this repo, please make sure it follows its formatting guidelines. ## TODO - Add persistence of metrics on restart +- forget/age out metrics receiving no updates anymore diff --git a/exampleconf/histogram.yaml b/exampleconf/histogram.yaml new file mode 100644 index 0000000..255fb65 --- /dev/null +++ b/exampleconf/histogram.yaml @@ -0,0 +1,23 @@ +# histogram metric. with Buckets <= 0.5, 5, 10, +inf + - name: 'network_ping_ms' + help: 'ping response in ms' + type: 'histogram' + topic: 'network/+/+/ping' + parameters: + buckets: + - 0.5 + - 5 + - 10 + label_configs: + - source_labels: ['__msg_topic__'] + target_label: '__topic__' + - source_labels: ["__msg_topic__"] + regex: "network/([^/]+).*" + target_label: "network" + replacement: '\1' + action: "replace" + - source_labels: ["__msg_topic__"] + regex: "network/[^/]+/([^/]+).*" + target_label: "server" + replacement: '\1' + action: "replace" \ No newline at end of file diff --git a/exampleconf/metric_example.yaml b/exampleconf/metric_example.yaml index d1d085e..89164fa 100644 --- a/exampleconf/metric_example.yaml +++ b/exampleconf/metric_example.yaml @@ -3,7 +3,14 @@ metrics: - name: 'mqtt_example' # Required(unique, if multiple, only last entry is kept) help: 'MQTT example gauge' # Required type: 'gauge' # Required ('gauge', 'counter', 'summary' or 'histogram') - #buckets: '.1, 1.0, 10.0, inf' # Optional (Passed as 'buckets' argument to Histogram) + #parameters: # Optional parameters for certain metrics + # buckets: # Optional (Passed as 'buckets' argument to Histogram) + # - .1 + # - 1.0 + # - 10.0 + # states: # Optional (Passes as 'states' arguments to Enum) + # - on + # - off topic: 'example/topic/+' # Required # Inspired by 'https://prometheus.io/docs/operating/configuration/#' diff --git a/exampleconf/switchstate.yaml b/exampleconf/switchstate.yaml new file mode 100644 index 0000000..9c9c85c --- /dev/null +++ b/exampleconf/switchstate.yaml @@ -0,0 +1,23 @@ +# metric for a switch with the state on and off. +# states are case sensitive and must match exactly +# use label_config to rewrite other values, see below. +metrics: + - name: "fhem_light_state" + help: "Light state on/off" + type: "enum" + topic: "fhem/+/+/light" + parameters: + states: + - 'on' + - 'off' + label_configs: + - source_labels: ['__value__'] # replace uppercase ON and 0 with on + regex: "(ON|0)" + target_label: '__value__' + replacement: 'on' + action: "replace" + - source_labels: ['__value__'] # replace uppercase OFF und 1 with off + regex: "(OFF|1)" + target_label: '__value__' + replacement: 'off' + action: "replace" \ No newline at end of file diff --git a/mqtt_exporter.py b/mqtt_exporter.py index f2b071f..5f7d221 100755 --- a/mqtt_exporter.py +++ b/mqtt_exporter.py @@ -1,30 +1,31 @@ #!/usr/bin/env python -from copy import copy, deepcopy +from copy import deepcopy import json -import prometheus_client as prometheus from collections import defaultdict import logging import argparse -import paho.mqtt.client as mqtt -import yaml import os import re import operator import time import signal import sys +import paho.mqtt.client as mqtt +import yaml +import prometheus_client as prometheus from yamlreader import yaml_load import utils.prometheus_additions import version VERSION = version.__version__ SUFFIXES_PER_TYPE = { - "gauge": [''], # add at least an empty suffix + "gauge": [], "counter": ['total'], "counter_absolute": ['total'], "summary": ['sum', 'count'], "histogram": ['sum', 'count', 'bucket'], + "enum": [], } @@ -187,7 +188,7 @@ def _log_setup(logging_config): raise TypeError(f'Invalid log level: {log_level}') if logfile != '': - logging.info('Logging redirected to: ' + logfile) + logging.info(f"Logging redirected to: {logfile}") # Need to replace the current handler on the root logger: file_handler = logging.FileHandler(logfile, 'a') formatter = logging.Formatter('%(asctime)s %(levelname)s: %(message)s') @@ -280,12 +281,11 @@ def _update_metrics(metrics, msg): if not _apply_label_config(labels, metric['label_configs']): continue + # try to convert to float, but leave as is if conversion not possible try: labels['__value__'] = float(labels['__value__'].replace(',', '.')) except ValueError: - logging.exception( - f"__value__ must be a number, was: {labels['__value__']}, Metric: {metric['name']} on __msg_topic_: {labels['__msg_topic__']}") - continue + logging.debug(f"Conversion of {labels['__value__']} to float not possible, continue with value as is.") logging.debug('_update_metrics all labels:') logging.debug(labels) @@ -352,7 +352,9 @@ def _export_to_prometheus(name, metric, labels): 'counter': CounterWrapper, 'counter_absolute': CounterAbsoluteWrapper, 'summary': SummaryWrapper, - 'histogram': HistogramWrapper} + 'histogram': HistogramWrapper, + 'enum': EnumWrapper, + } valid_types = metric_wrappers.keys() if metric['type'] not in valid_types: logging.error( @@ -378,8 +380,11 @@ def _export_to_prometheus(name, metric, labels): metric['prometheus_metric']['parent'] = prometheus_metric else: prometheus_metric = metric['prometheus_metric']['parent'] - - prometheus_metric.update(label_values, value) + try: + prometheus_metric.update(label_values, value) + except ValueError as ve: + logging.error(f"Value {value} is not compatible with metric {metric['name']} of type {metric['type']}") + logging.exception('ve:') logging.debug( f"_export_to_prometheus metric ({metric['type']}): {name}{labels} updated with value: {value}") @@ -421,12 +426,10 @@ class GaugeWrapper(): """ Wrapper to provide generic interface to Gauge metric """ - def __init__(self, name, help_text, label_names, *args, **kwargs) -> None: self.metric = prometheus.Gauge( name, help_text, list(label_names) ) - def update(self, label_values, value): child = self.metric.labels(*label_values) child.set(value) @@ -448,6 +451,10 @@ def update(self, label_values, value): child.inc(value) return child +class HistogramWrapper(): + """ + Wrapper to provide generic interface to Summary metric + """ class CounterAbsoluteWrapper(): """ @@ -489,7 +496,10 @@ class HistogramWrapper(): def __init__(self, name, help_text, label_names, *args, **kwargs) -> None: params = {} if kwargs.get('buckets'): - params['buckets'] = kwargs['buckets'].split(',') + if isinstance(kwargs['buckets'], str): + params['buckets'] = kwargs['buckets'].split(',') + else: + params['buckets'] = kwargs['buckets'] self.metric = prometheus.Histogram( name, help_text, list(label_names), **params @@ -501,6 +511,22 @@ def update(self, label_values, value): return child +class EnumWrapper(): + def __init__(self, name, help_text, label_names, *args, **kwargs) -> None: + params = {} + if kwargs.get('states'): + params['states'] = kwargs['states'] + + self.metric = prometheus.Enum( + name, help_text, list(label_names), **params + ) + + def update(self, label_values, value): + child = self.metric.labels(*label_values) + child.state(value) + return child + + def add_static_metric(timestamp): g = prometheus.Gauge('mqtt_exporter_timestamp', 'Startup time of exporter in millis since EPOC (static)', ['exporter_version']) diff --git a/tests/test_data/test_enum/conf.yaml b/tests/test_data/test_enum/conf.yaml new file mode 100644 index 0000000..0de7a6b --- /dev/null +++ b/tests/test_data/test_enum/conf.yaml @@ -0,0 +1,58 @@ + +# Logging +logging: + # logfile: 'conf/mqttexperter.log' # Optional default '' (stdout) + level: 'debug' # Optional default 'info' + +timescale: 0 + +# Metric definitions +metrics: + - name: "fhem_light_state" + help: "Light state on/off" + type: "enum" + topic: "fhem/+/+/light" + parameters: + states: + - 'on' + - 'off' + label_configs: + - source_labels: ['__value__'] + regex: "(ON|0)" + target_label: '__value__' + replacement: 'on' + action: "replace" + - source_labels: ['__value__'] + regex: "(OFF|1)" + target_label: '__value__' + replacement: 'off' + action: "replace" + - source_labels: ['__msg_topic__'] + target_label: '__topic__' + - source_labels: ["__msg_topic__"] + regex: "fhem/([^/]+).*" + target_label: "location" + replacement: '\1' + action: "replace" + - name: 'network_ping_ms' + help: 'ping response in ms' + type: 'histogram' + topic: 'network/+/+/ping' + parameters: + buckets: + - 0.5 + - 5 + - 10 + label_configs: + - source_labels: ['__msg_topic__'] + target_label: '__topic__' + - source_labels: ["__msg_topic__"] + regex: "network/([^/]+).*" + target_label: "network" + replacement: '\1' + action: "replace" + - source_labels: ["__msg_topic__"] + regex: "network/[^/]+/([^/]+).*" + target_label: "server" + replacement: '\1' + action: "replace" \ No newline at end of file diff --git a/tests/test_data/test_enum/mqtt_msg.csv b/tests/test_data/test_enum/mqtt_msg.csv new file mode 100644 index 0000000..95a6966 --- /dev/null +++ b/tests/test_data/test_enum/mqtt_msg.csv @@ -0,0 +1,23 @@ +in_topic;in_payload;out_name;out_labels;out_value;delay;assert +fhem/room01/desk/light01;on;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};0;4;True +fhem/room01/desk/light01;on;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};0;3;True +fhem/room01/desk/light01;off;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};1;5;True +fhem/room01/desk/light01;on;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};0;4;True +fhem/room01/desk/light01;off;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};1;3;True +fhem/room01/desk/light01;ON;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};0;5;True +fhem/room01/desk/light01;OFF;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};1;4;True +fhem/room01/desk/light01;off;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};1;3;True +fhem/room01/desk/light01;1;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};1;5;True +fhem/room01/desk/light01;0;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};0;4;True +fhem/room01/desk/light01;on;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};0;3;True +fhem/room01/desk/light01;off;fhem_light_state;{"location":"Garten","topic": "fhem/room01/desk/light01"};1;5;True +network/vlan11/srv01.local/ping;2;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "5.0"};{"_count": 1, "_sum": 2, "_bucket": 1};2;True +network/vlan11/srv01.local/ping;4;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "5.0"};{"_count": 2, "_sum": 6, "_bucket": 2};6;True +network/vlan11/srv01.local/ping;7;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "10.0"};{"_count": 3, "_sum": 13, "_bucket": 3};1;True +network/vlan11/srv01.local/ping;0.4;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "0.5"};{"_count": 4, "_sum": 13.4, "_bucket": 1};4;True +network/vlan11/srv01.local/ping;20;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "+Inf"};{"_count": 5, "_sum": 33.4, "_bucket": 5};5;True +network/vlan11/srv01.local/ping;11.1;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "+Inf"};{"_count": 6, "_sum": 44.5, "_bucket": 6};2;True +network/vlan11/srv01.local/ping;5;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "5.0"};{"_count": 7, "_sum": 49.5, "_bucket": 4};4;True +network/vlan11/srv01.local/ping;6;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "10.0"};{"_count": 8, "_sum": 55.5, "_bucket": 6};1;True +network/vlan11/srv01.local/ping;0.05;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "0.5"};{"_count": 9, "_sum": 55.55, "_bucket": 2};4;True +network/vlan11/srv01.local/ping;30;network_ping_ms;{"network": "vlan11","topic": "network/vlan11/srv01.local/ping", "server": "srv01.local", "le": "+Inf"};{"_count": 10, "_sum": 85.55, "_bucket": 10};5;True \ No newline at end of file diff --git a/tests/test_mqtt_exporter.py b/tests/test_mqtt_exporter.py index 946d223..114bd34 100644 --- a/tests/test_mqtt_exporter.py +++ b/tests/test_mqtt_exporter.py @@ -62,7 +62,11 @@ def _get_mqtt_data(file_name): # covert payloud to bytes, as in a MQTT Message row[MqttCVS.in_payload] = row[MqttCVS.in_payload].encode('UTF-8') # parse labels, to a python object. - row[MqttCVS.out_labels] = json.loads(row.get(MqttCVS.out_labels, '{}')) + try: + row[MqttCVS.out_labels] = json.loads(row.get(MqttCVS.out_labels, '{}')) + except json.decoder.JSONDecodeError as jde: + logging.error(f"json.decoder.JSONDecodeError while decoding {row.get(MqttCVS.out_labels, '{}')}") + raise jde # Value could be a JSON, a float or anthing else. try: row[MqttCVS.out_value] = float(row.get(MqttCVS.out_value))