|
20 | 20 | from chip.clusters.ClusterObjects import ALL_ATTRIBUTES, ALL_CLUSTERS, Cluster
|
21 | 21 | from chip.exceptions import ChipStackError
|
22 | 22 | from chip.native import PyChipError
|
23 |
| -from zeroconf import IPVersion, ServiceStateChange, Zeroconf |
| 23 | +from zeroconf import BadTypeInNameException, IPVersion, ServiceStateChange, Zeroconf |
24 | 24 | from zeroconf.asyncio import AsyncServiceBrowser, AsyncServiceInfo, AsyncZeroconf
|
25 | 25 |
|
26 | 26 | from matter_server.common.models import CommissionableNodeData, CommissioningParameters
|
|
72 | 72 | NODE_RESUBSCRIBE_TIMEOUT_OFFLINE = 30 * 60 * 1000
|
73 | 73 | NODE_PING_TIMEOUT = 10
|
74 | 74 | NODE_PING_TIMEOUT_BATTERY_POWERED = 60
|
75 |
| -NODE_MDNS_BACKOFF = 60 |
| 75 | +NODE_MDNS_BACKOFF = 300 |
76 | 76 | FALLBACK_NODE_SCANNER_INTERVAL = 1800
|
77 | 77 |
|
78 | 78 | MDNS_TYPE_OPERATIONAL_NODE = "_matter._tcp.local."
|
@@ -119,6 +119,7 @@ def __init__(
|
119 | 119 | max_workers=1, thread_name_prefix="SDKExecutor"
|
120 | 120 | )
|
121 | 121 | self._node_setup_throttle = asyncio.Semaphore(10)
|
| 122 | + self._mdns_event_timer: dict[str, asyncio.TimerHandle] = {} |
122 | 123 |
|
123 | 124 | async def initialize(self) -> None:
|
124 | 125 | """Async initialize of controller."""
|
@@ -1198,66 +1199,101 @@ def _on_mdns_service_state_change(
|
1198 | 1199 | name: str,
|
1199 | 1200 | state_change: ServiceStateChange,
|
1200 | 1201 | ) -> None:
|
1201 |
| - LOGGER.debug("Received %s MDNS event for %s", state_change, name) |
| 1202 | + # mdns events may arrive in bursts of (duplicate) messages |
| 1203 | + # so we debounce this with a timer handle. |
| 1204 | + if state_change == ServiceStateChange.Removed: |
| 1205 | + # if we have an existing timer for this name, cancel it. |
| 1206 | + if cancel := self._mdns_event_timer.pop(name, None): |
| 1207 | + cancel.cancel() |
| 1208 | + if service_type == MDNS_TYPE_OPERATIONAL_NODE: |
| 1209 | + # we're not interested in operational node removals, |
| 1210 | + # this is already handled by the subscription logic |
| 1211 | + return |
| 1212 | + |
| 1213 | + if name in self._mdns_event_timer: |
| 1214 | + # We already have a timer to resolve this service, so ignore this callback. |
| 1215 | + return |
| 1216 | + |
| 1217 | + if TYPE_CHECKING: |
| 1218 | + assert self.server.loop |
| 1219 | + |
1202 | 1220 | if service_type == MDNS_TYPE_COMMISSIONABLE_NODE:
|
1203 |
| - asyncio.create_task( |
1204 |
| - self._on_mdns_commissionable_node_state(name, state_change) |
| 1221 | + # process the event with a debounce timer |
| 1222 | + self._mdns_event_timer[name] = self.server.loop.call_later( |
| 1223 | + 0.5, self._on_mdns_commissionable_node_state, name, state_change |
1205 | 1224 | )
|
1206 | 1225 | return
|
| 1226 | + |
1207 | 1227 | if service_type == MDNS_TYPE_OPERATIONAL_NODE:
|
1208 |
| - self._on_mdns_operational_node_state(name, state_change) |
| 1228 | + if self.fabric_id_hex not in name.lower(): |
| 1229 | + # filter out messages that are not for our fabric |
| 1230 | + return |
| 1231 | + # process the event with a debounce timer |
| 1232 | + self._mdns_event_timer[name] = self.server.loop.call_later( |
| 1233 | + 0.5, self._on_mdns_operational_node_state, name, state_change |
| 1234 | + ) |
1209 | 1235 |
|
1210 | 1236 | def _on_mdns_operational_node_state(
|
1211 | 1237 | self, name: str, state_change: ServiceStateChange
|
1212 | 1238 | ) -> None:
|
1213 | 1239 | """Handle a (operational) Matter node MDNS state change."""
|
1214 |
| - name = name.lower() |
1215 |
| - if self.fabric_id_hex not in name: |
1216 |
| - # filter out messages that are not for our fabric |
1217 |
| - return |
1218 |
| - |
1219 |
| - if state_change == ServiceStateChange.Removed: |
1220 |
| - # we're not interested in removals as this is already |
1221 |
| - # handled in the subscription logic |
1222 |
| - return |
1223 |
| - |
| 1240 | + self._mdns_event_timer.pop(name, None) |
| 1241 | + logger = LOGGER.getChild("mdns") |
1224 | 1242 | # the mdns name is constructed as [fabricid]-[nodeid]._matter._tcp.local.
|
1225 | 1243 | # extract the node id from the name
|
1226 | 1244 | node_id = int(name.split("-")[1].split(".")[0], 16)
|
1227 | 1245 |
|
1228 | 1246 | if not (node := self._nodes.get(node_id)):
|
1229 | 1247 | return # this should not happen, but guard just in case
|
1230 | 1248 |
|
1231 |
| - # mdns events for matter devices arrive in bursts of (duplicate) messages |
1232 |
| - # so we debounce this as we only use the mdns messages for operational node discovery |
1233 |
| - # and we have other logic in place to determine node aliveness |
1234 | 1249 | now = time.time()
|
1235 | 1250 | last_seen = self._node_last_seen.get(node_id, 0)
|
1236 |
| - if node.available and now - last_seen < NODE_MDNS_BACKOFF: |
1237 |
| - return |
1238 | 1251 | self._node_last_seen[node_id] = now
|
1239 | 1252 |
|
1240 |
| - # we treat UPDATE state changes as ADD if the node is marked as |
| 1253 | + # we only treat UPDATE state changes as ADD if the node is marked as |
1241 | 1254 | # unavailable to ensure we catch a node being operational
|
1242 | 1255 | if node.available and state_change == ServiceStateChange.Updated:
|
1243 | 1256 | return
|
1244 | 1257 |
|
1245 | 1258 | if node_id in self._nodes_in_setup:
|
1246 | 1259 | # prevent duplicate setup actions
|
1247 | 1260 | return
|
1248 |
| - LOGGER.info("Node %s (re)discovered on MDNS", node_id) |
| 1261 | + |
| 1262 | + if node_id not in self._subscriptions: |
| 1263 | + logger.info("Node %s discovered on MDNS", node_id) |
| 1264 | + elif (now - last_seen) > NODE_MDNS_BACKOFF: |
| 1265 | + # node came back online after being offline for a while or restarted |
| 1266 | + logger.info("Node %s re-discovered on MDNS", node_id) |
| 1267 | + else: |
| 1268 | + # ignore all other cases |
| 1269 | + return |
| 1270 | + |
1249 | 1271 | # setup the node - this will (re) setup the subscriptions etc.
|
1250 | 1272 | asyncio.create_task(self._setup_node(node_id))
|
1251 | 1273 |
|
1252 |
| - async def _on_mdns_commissionable_node_state( |
| 1274 | + def _on_mdns_commissionable_node_state( |
1253 | 1275 | self, name: str, state_change: ServiceStateChange
|
1254 | 1276 | ) -> None:
|
1255 | 1277 | """Handle a (commissionable) Matter node MDNS state change."""
|
1256 |
| - if state_change == ServiceStateChange.Added: |
| 1278 | + self._mdns_event_timer.pop(name, None) |
| 1279 | + logger = LOGGER.getChild("mdns") |
| 1280 | + |
| 1281 | + try: |
1257 | 1282 | info = AsyncServiceInfo(MDNS_TYPE_COMMISSIONABLE_NODE, name)
|
1258 |
| - assert self._aiozc is not None |
| 1283 | + except BadTypeInNameException as ex: |
| 1284 | + logger.debug("Ignoring record with bad type in name: %s: %s", name, ex) |
| 1285 | + return |
| 1286 | + |
| 1287 | + async def handle_commissionable_node_added() -> None: |
| 1288 | + if TYPE_CHECKING: |
| 1289 | + assert self._aiozc is not None |
1259 | 1290 | await info.async_request(self._aiozc.zeroconf, 3000)
|
1260 |
| - LOGGER.debug("Discovered commissionable Matter node using MDNS: %s", info) |
| 1291 | + logger.debug("Discovered commissionable Matter node: %s", info) |
| 1292 | + |
| 1293 | + if state_change == ServiceStateChange.Added: |
| 1294 | + asyncio.create_task(handle_commissionable_node_added()) |
| 1295 | + elif state_change == ServiceStateChange.Removed: |
| 1296 | + logger.debug("Commissionable Matter node disappeared: %s", info) |
1261 | 1297 |
|
1262 | 1298 | def _write_node_state(self, node_id: int, force: bool = False) -> None:
|
1263 | 1299 | """Schedule the write of the current node state to persistent storage."""
|
|
0 commit comments