Skip to content

Commit acb33e3

Browse files
committed
better debouncing of mdns
1 parent a282370 commit acb33e3

File tree

1 file changed

+63
-27
lines changed

1 file changed

+63
-27
lines changed

matter_server/server/device_controller.py

+63-27
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@
2020
from chip.clusters.ClusterObjects import ALL_ATTRIBUTES, ALL_CLUSTERS, Cluster
2121
from chip.exceptions import ChipStackError
2222
from chip.native import PyChipError
23-
from zeroconf import IPVersion, ServiceStateChange, Zeroconf
23+
from zeroconf import BadTypeInNameException, IPVersion, ServiceStateChange, Zeroconf
2424
from zeroconf.asyncio import AsyncServiceBrowser, AsyncServiceInfo, AsyncZeroconf
2525

2626
from matter_server.common.models import CommissionableNodeData, CommissioningParameters
@@ -72,7 +72,7 @@
7272
NODE_RESUBSCRIBE_TIMEOUT_OFFLINE = 30 * 60 * 1000
7373
NODE_PING_TIMEOUT = 10
7474
NODE_PING_TIMEOUT_BATTERY_POWERED = 60
75-
NODE_MDNS_BACKOFF = 60
75+
NODE_MDNS_BACKOFF = 300
7676
FALLBACK_NODE_SCANNER_INTERVAL = 1800
7777

7878
MDNS_TYPE_OPERATIONAL_NODE = "_matter._tcp.local."
@@ -119,6 +119,7 @@ def __init__(
119119
max_workers=1, thread_name_prefix="SDKExecutor"
120120
)
121121
self._node_setup_throttle = asyncio.Semaphore(10)
122+
self._mdns_event_timer: dict[str, asyncio.TimerHandle] = {}
122123

123124
async def initialize(self) -> None:
124125
"""Async initialize of controller."""
@@ -1198,66 +1199,101 @@ def _on_mdns_service_state_change(
11981199
name: str,
11991200
state_change: ServiceStateChange,
12001201
) -> None:
1201-
LOGGER.debug("Received %s MDNS event for %s", state_change, name)
1202+
# mdns events may arrive in bursts of (duplicate) messages
1203+
# so we debounce this with a timer handle.
1204+
if state_change == ServiceStateChange.Removed:
1205+
# if we have an existing timer for this name, cancel it.
1206+
if cancel := self._mdns_event_timer.pop(name, None):
1207+
cancel.cancel()
1208+
if service_type == MDNS_TYPE_OPERATIONAL_NODE:
1209+
# we're not interested in operational node removals,
1210+
# this is already handled by the subscription logic
1211+
return
1212+
1213+
if name in self._mdns_event_timer:
1214+
# We already have a timer to resolve this service, so ignore this callback.
1215+
return
1216+
1217+
if TYPE_CHECKING:
1218+
assert self.server.loop
1219+
12021220
if service_type == MDNS_TYPE_COMMISSIONABLE_NODE:
1203-
asyncio.create_task(
1204-
self._on_mdns_commissionable_node_state(name, state_change)
1221+
# process the event with a debounce timer
1222+
self._mdns_event_timer[name] = self.server.loop.call_later(
1223+
0.5, self._on_mdns_commissionable_node_state, name, state_change
12051224
)
12061225
return
1226+
12071227
if service_type == MDNS_TYPE_OPERATIONAL_NODE:
1208-
self._on_mdns_operational_node_state(name, state_change)
1228+
if self.fabric_id_hex not in name.lower():
1229+
# filter out messages that are not for our fabric
1230+
return
1231+
# process the event with a debounce timer
1232+
self._mdns_event_timer[name] = self.server.loop.call_later(
1233+
0.5, self._on_mdns_operational_node_state, name, state_change
1234+
)
12091235

12101236
def _on_mdns_operational_node_state(
12111237
self, name: str, state_change: ServiceStateChange
12121238
) -> None:
12131239
"""Handle a (operational) Matter node MDNS state change."""
1214-
name = name.lower()
1215-
if self.fabric_id_hex not in name:
1216-
# filter out messages that are not for our fabric
1217-
return
1218-
1219-
if state_change == ServiceStateChange.Removed:
1220-
# we're not interested in removals as this is already
1221-
# handled in the subscription logic
1222-
return
1223-
1240+
self._mdns_event_timer.pop(name, None)
1241+
logger = LOGGER.getChild("mdns")
12241242
# the mdns name is constructed as [fabricid]-[nodeid]._matter._tcp.local.
12251243
# extract the node id from the name
12261244
node_id = int(name.split("-")[1].split(".")[0], 16)
12271245

12281246
if not (node := self._nodes.get(node_id)):
12291247
return # this should not happen, but guard just in case
12301248

1231-
# mdns events for matter devices arrive in bursts of (duplicate) messages
1232-
# so we debounce this as we only use the mdns messages for operational node discovery
1233-
# and we have other logic in place to determine node aliveness
12341249
now = time.time()
12351250
last_seen = self._node_last_seen.get(node_id, 0)
1236-
if node.available and now - last_seen < NODE_MDNS_BACKOFF:
1237-
return
12381251
self._node_last_seen[node_id] = now
12391252

1240-
# we treat UPDATE state changes as ADD if the node is marked as
1253+
# we only treat UPDATE state changes as ADD if the node is marked as
12411254
# unavailable to ensure we catch a node being operational
12421255
if node.available and state_change == ServiceStateChange.Updated:
12431256
return
12441257

12451258
if node_id in self._nodes_in_setup:
12461259
# prevent duplicate setup actions
12471260
return
1248-
LOGGER.info("Node %s (re)discovered on MDNS", node_id)
1261+
1262+
if node_id not in self._subscriptions:
1263+
logger.info("Node %s discovered on MDNS", node_id)
1264+
elif (now - last_seen) > NODE_MDNS_BACKOFF:
1265+
# node came back online after being offline for a while or restarted
1266+
logger.info("Node %s re-discovered on MDNS", node_id)
1267+
else:
1268+
# ignore all other cases
1269+
return
1270+
12491271
# setup the node - this will (re) setup the subscriptions etc.
12501272
asyncio.create_task(self._setup_node(node_id))
12511273

1252-
async def _on_mdns_commissionable_node_state(
1274+
def _on_mdns_commissionable_node_state(
12531275
self, name: str, state_change: ServiceStateChange
12541276
) -> None:
12551277
"""Handle a (commissionable) Matter node MDNS state change."""
1256-
if state_change == ServiceStateChange.Added:
1278+
self._mdns_event_timer.pop(name, None)
1279+
logger = LOGGER.getChild("mdns")
1280+
1281+
try:
12571282
info = AsyncServiceInfo(MDNS_TYPE_COMMISSIONABLE_NODE, name)
1258-
assert self._aiozc is not None
1283+
except BadTypeInNameException as ex:
1284+
logger.debug("Ignoring record with bad type in name: %s: %s", name, ex)
1285+
return
1286+
1287+
async def handle_commissionable_node_added() -> None:
1288+
if TYPE_CHECKING:
1289+
assert self._aiozc is not None
12591290
await info.async_request(self._aiozc.zeroconf, 3000)
1260-
LOGGER.debug("Discovered commissionable Matter node using MDNS: %s", info)
1291+
logger.debug("Discovered commissionable Matter node: %s", info)
1292+
1293+
if state_change == ServiceStateChange.Added:
1294+
asyncio.create_task(handle_commissionable_node_added())
1295+
elif state_change == ServiceStateChange.Removed:
1296+
logger.debug("Commissionable Matter node disappeared: %s", info)
12611297

12621298
def _write_node_state(self, node_id: int, force: bool = False) -> None:
12631299
"""Schedule the write of the current node state to persistent storage."""

0 commit comments

Comments
 (0)