Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add more prometheus labels #128607

Draft
wants to merge 55 commits into
base: dev
Choose a base branch
from
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
55 commits
Select commit Hold shift + click to select a range
cf430ab
First pass at adding prometheus labels
jzucker2 Oct 17, 2024
56927d6
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Oct 17, 2024
06b619a
Small change to start prepping tests
jzucker2 Oct 17, 2024
71a6a28
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 23, 2024
821af8c
Catching back up after a minute
jzucker2 Nov 23, 2024
cb1d0ec
And again with moar fixez
jzucker2 Nov 23, 2024
0e12d02
It still works
jzucker2 Nov 23, 2024
79c8f4b
Getting closer I think
jzucker2 Nov 23, 2024
e8123bf
Trying to force some basic labels in
jzucker2 Nov 23, 2024
3f386d5
Starting to add more labels
jzucker2 Nov 23, 2024
330cf67
This feels like a mess
jzucker2 Nov 24, 2024
e93a648
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 24, 2024
4b89077
Can't get area working
jzucker2 Nov 24, 2024
579900c
Can't make the tests notice the area
jzucker2 Nov 24, 2024
2e8ae04
Getting closer to useful
jzucker2 Nov 24, 2024
a5a99bd
Finally getting closer
jzucker2 Nov 24, 2024
e20ce99
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 24, 2024
e79b198
Is this better?
jzucker2 Nov 24, 2024
f777933
More clean up
jzucker2 Nov 24, 2024
f8d32ec
More clean up
jzucker2 Nov 24, 2024
4cc7b79
Cleaned up a lot and added mocks for devices to many entities
jzucker2 Nov 24, 2024
b5fbfb2
This is good
jzucker2 Nov 24, 2024
86f901a
Trying to add more mocks and tests for devices and areas
jzucker2 Nov 24, 2024
9b20f1c
t got stupid at the end
jzucker2 Nov 24, 2024
bdd6176
Added basic label tests for everything
jzucker2 Nov 24, 2024
2f9ef5e
Cleaned this all up again and now I'm ready for checking
jzucker2 Nov 24, 2024
7320a3e
Finally ready to move forward
jzucker2 Nov 24, 2024
1a4fa88
More tests added
jzucker2 Nov 24, 2024
eb4ccb0
Added a test to non unit device and area too
jzucker2 Nov 24, 2024
868f40e
One last pass on adding basic entity types
jzucker2 Nov 24, 2024
28b5f3b
This really fell apart at the end
jzucker2 Nov 24, 2024
e0fefa2
Adding more tests
jzucker2 Nov 24, 2024
d6e7962
OOps, had that twice
jzucker2 Nov 24, 2024
5bf3c34
I got pretty close here
jzucker2 Nov 24, 2024
bed2254
Another pass on consolidating devices and areas
jzucker2 Nov 24, 2024
b0dbe25
Getting closer to most working examples
jzucker2 Nov 24, 2024
1637ece
Another pass on entities
jzucker2 Nov 24, 2024
05012d5
Another pass on stuff
jzucker2 Nov 24, 2024
45a719e
Renaming and global config
jzucker2 Nov 24, 2024
39e9380
Now this is funny
jzucker2 Nov 24, 2024
cce2fbb
Another pass on refactoring
jzucker2 Nov 24, 2024
1229ae3
And again but simplified
jzucker2 Nov 24, 2024
351eb55
Getting much closer now
jzucker2 Nov 24, 2024
508ff60
Well now I'm covering most optimistic paths
jzucker2 Nov 24, 2024
ddb40ce
Successfully fixed up a ton of tests
jzucker2 Nov 24, 2024
f674d3e
Need to handle state changes better
jzucker2 Nov 24, 2024
475a1ed
Stopping point with tests but needs functionality fixes
jzucker2 Nov 24, 2024
2eb5d54
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 24, 2024
65b5789
Finally getting close to something
jzucker2 Nov 24, 2024
90e91ef
Actually testing area now
jzucker2 Nov 24, 2024
2fe6344
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 24, 2024
e53528f
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 25, 2024
3288e3a
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 28, 2024
c856d78
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 30, 2024
365a992
Merge branch 'dev' into experimental-add-more-prometheus-labels
jzucker2 Nov 30, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
184 changes: 160 additions & 24 deletions homeassistant/components/prometheus/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@

from collections.abc import Callable
from contextlib import suppress
from enum import Enum
import logging
import string
from typing import Any, cast
Expand Down Expand Up @@ -43,8 +44,10 @@
from homeassistant.components.light import ATTR_BRIGHTNESS
from homeassistant.components.sensor import SensorDeviceClass
from homeassistant.const import (
ATTR_AREA_ID,
ATTR_BATTERY_LEVEL,
ATTR_DEVICE_CLASS,
ATTR_DEVICE_ID,
ATTR_FRIENDLY_NAME,
ATTR_MODE,
ATTR_TEMPERATURE,
Expand All @@ -62,7 +65,13 @@
UnitOfTemperature,
)
from homeassistant.core import Event, EventStateChangedData, HomeAssistant, State
from homeassistant.helpers import entityfilter, state as state_helper
from homeassistant.helpers import (
area_registry as ar,
device_registry as dr,
entity_registry as er,
entityfilter,
state as state_helper,
)
import homeassistant.helpers.config_validation as cv
from homeassistant.helpers.entity_registry import (
EVENT_ENTITY_REGISTRY_UPDATED,
Expand Down Expand Up @@ -136,11 +145,18 @@
conf[CONF_COMPONENT_CONFIG_GLOB],
)

area_registry = ar.async_get(hass)
device_registry = dr.async_get(hass)
entity_registry = er.async_get(hass)

metrics = PrometheusMetrics(
entity_filter,
namespace,
climate_units,
component_config,
area_registry,
device_registry,
entity_registry,
override_metric,
default_metric,
)
Expand All @@ -158,6 +174,63 @@
return True


class PrometheusLabelsException(Exception):
"""Exceptions when dealing with shared PrometheusLabels functionality."""


class PrometheusLabels(Enum):
"""Model shared Prometheus labels."""

ENTITY = "entity"
FRIENDLY_NAME = "friendly_name"
OBJECT_ID = "object_id"
DOMAIN = "domain"
DEVICE = "device"
AREA = "area"
PLATFORM = "platform"
UNKNOWN = "unknown" # mostly just for testing

@classmethod
def get_shared_common_labels(cls) -> list[PrometheusLabels]:
"""Return all shared prometheus labels that are always expected."""
return [
cls.ENTITY,
cls.OBJECT_ID,
cls.DOMAIN,
cls.FRIENDLY_NAME,
]

@classmethod
def get_all_common_label_strings(cls) -> list[str]:
"""Return all possible common prometheus label strings."""
return [p.value for p in cls if p != cls.UNKNOWN]

@classmethod
def label_value_from_state(cls, label: PrometheusLabels, state: State) -> str:
"""Return a label value for a metric from a hass state."""
if label == cls.ENTITY:
return state.entity_id
if label == cls.OBJECT_ID:
return state.object_id
if label == cls.DOMAIN:
return state.domain
if label == cls.FRIENDLY_NAME:
return state.attributes.get(ATTR_FRIENDLY_NAME) or ""
raise PrometheusLabelsException(f"Unexpected label: {label}")

def label_value(self, state: State) -> str:
"""Return a label value as an instance shortcut to `cls.label_value_from_state`."""
return self.label_value_from_state(self, state)

@classmethod
def get_shared_common_label_dict(cls, state: State) -> dict[str, str]:
"""Return a dict of label and values for all shared expected metrics for a state."""
final_labels = {}
for label in cls.get_shared_common_labels():
final_labels[label.value] = label.label_value(state)
return dict(final_labels)


class PrometheusMetrics:
"""Model all of the metrics which should be exposed to Prometheus."""

Expand All @@ -167,11 +240,17 @@
namespace: str,
climate_units: UnitOfTemperature,
component_config: EntityValues,
area_registry: ar.AreaRegistry,
device_registry: dr.DeviceRegistry,
entity_registry: er.EntityRegistry,
override_metric: str | None,
default_metric: str | None,
) -> None:
"""Initialize Prometheus Metrics."""
self._component_config = component_config
self._area_registry = area_registry
self._device_registry = device_registry
self._entity_registry = entity_registry
self._override_metric = override_metric
self._default_metric = default_metric
self._filter = entity_filter
Expand All @@ -198,14 +277,28 @@
if (state := event.data.get("new_state")) is None:
return

# Need to handle state changes for area and device here
if not self._filter(state.entity_id):
_LOGGER.debug("Filtered out entity %s", state.entity_id)
return

if (old_state := event.data.get("old_state")) is not None and (
old_friendly_name := old_state.attributes.get(ATTR_FRIENDLY_NAME)
) != state.attributes.get(ATTR_FRIENDLY_NAME):
self._remove_labelsets(old_state.entity_id, old_friendly_name)
if (old_state := event.data.get("old_state")) is not None:
removal_kwargs = {}
if (
old_friendly_name := old_state.attributes.get(ATTR_FRIENDLY_NAME)
) != state.attributes.get(ATTR_FRIENDLY_NAME):
removal_kwargs["friendly_name"] = old_friendly_name
if (
old_area_id := old_state.attributes.get(ATTR_AREA_ID)
) != state.attributes.get(ATTR_AREA_ID):
old_area = self._area_registry.async_get_area(str(old_area_id))
if old_area and (old_area_name := old_area.name):
removal_kwargs["area"] = old_area_name
else:
removal_kwargs["area"] = old_area_id

Check warning on line 298 in homeassistant/components/prometheus/__init__.py

View check run for this annotation

Codecov / codecov/patch

homeassistant/components/prometheus/__init__.py#L298

Added line #L298 was not covered by tests

if removal_kwargs:
self._remove_labelsets(old_state.entity_id, **removal_kwargs)

self.handle_state(state)

Expand Down Expand Up @@ -237,8 +330,12 @@
if state.state in IGNORED_STATES:
self._remove_labelsets(
entity_id,
None,
{state_change, entity_available, last_updated_time_seconds},
friendly_name=None,
ignored_metrics={
state_change,
entity_available,
last_updated_time_seconds,
},
)
else:
domain, _ = hacore.split_entity_id(entity_id)
Expand Down Expand Up @@ -275,6 +372,7 @@
self,
entity_id: str,
friendly_name: str | None = None,
area: str | None = None,
ignored_metrics: set[MetricWrapperBase] | None = None,
) -> None:
"""Remove labelsets matching the given entity id from all non-ignored metrics."""
Expand All @@ -286,16 +384,30 @@
for sample in cast(list[prometheus_client.Metric], metric.collect())[
0
].samples:
if sample.labels["entity"] == entity_id and (
not friendly_name or sample.labels["friendly_name"] == friendly_name
):
_LOGGER.debug(
"Removing labelset from %s for entity_id: %s",
sample.name,
entity_id,
)
with suppress(KeyError):
metric.remove(*sample.labels.values())
if sample.labels["entity"] == entity_id:
if (
not friendly_name
or sample.labels["friendly_name"] == friendly_name
):
_LOGGER.debug(
"!!!!!!! friendly_name Removing labelset (%s, %s) from %s for entity_id: %s",
friendly_name,
area,
sample.name,
entity_id,
)
with suppress(KeyError):
metric.remove(*sample.labels.values())
if not area or sample.labels["area"] == area:
_LOGGER.debug(
"!!!!!!! area Removing labelset (%s, %s) from %s for entity_id: %s",
friendly_name,
area,
sample.name,
entity_id,
)
with suppress(KeyError):
metric.remove(*sample.labels.values())

def _handle_attributes(self, state: State) -> None:
for key, value in state.attributes.items():
Expand All @@ -318,7 +430,7 @@
documentation: str,
extra_labels: list[str] | None = None,
) -> _MetricBaseT:
labels = ["entity", "friendly_name", "domain"]
labels = PrometheusLabels.get_all_common_label_strings()
if extra_labels is not None:
labels.extend(extra_labels)

Expand Down Expand Up @@ -355,14 +467,39 @@
value = None
return value

@staticmethod
def _labels(state: State) -> dict[str, Any]:
def _get_extra_labels(self, state: State) -> dict[str, Any]:
"""Return a dict of extra labels, or None if no extra labels necessary."""
final_area = ""
final_device = ""
final_platform = ""
if entity := self._entity_registry.async_get(state.entity_id):
final_platform = entity.platform
if device_id := state.attributes.get(ATTR_DEVICE_ID):
if device := self._device_registry.async_get(device_id):
if device_name := device.name:
final_device = device_name
else:
final_device = device_id

Check warning on line 482 in homeassistant/components/prometheus/__init__.py

View check run for this annotation

Codecov / codecov/patch

homeassistant/components/prometheus/__init__.py#L482

Added line #L482 was not covered by tests
if area_id := state.attributes.get(ATTR_AREA_ID):
if area := self._area_registry.async_get_area(area_id):
if area_name := area.name:
final_area = area_name
else:
final_area = area_id

Check warning on line 488 in homeassistant/components/prometheus/__init__.py

View check run for this annotation

Codecov / codecov/patch

homeassistant/components/prometheus/__init__.py#L488

Added line #L488 was not covered by tests
return {
"entity": state.entity_id,
"domain": state.domain,
"friendly_name": state.attributes.get(ATTR_FRIENDLY_NAME),
"platform": final_platform,
"area": final_area,
"device": final_device,
}

def _labels(self, state: State) -> dict[str, Any]:
final_labels = PrometheusLabels.get_shared_common_label_dict(state)

if extra_labels := self._get_extra_labels(state):
final_labels.update(extra_labels)

return dict(final_labels)

def _battery(self, state: State) -> None:
if (battery_level := state.attributes.get(ATTR_BATTERY_LEVEL)) is not None:
metric = self._metric(
Expand Down Expand Up @@ -632,7 +769,6 @@
documentation = "State of the sensor"
if unit:
documentation = f"Sensor data measured in {unit}"

_metric = self._metric(metric, prometheus_client.Gauge, documentation)

if (value := self.state_as_number(state)) is not None:
Expand Down
Loading