diff --git a/src/service/10-link-local-mgmt b/src/service/10-link-local-mgmt index 3908060..e4e7b86 100644 --- a/src/service/10-link-local-mgmt +++ b/src/service/10-link-local-mgmt @@ -40,19 +40,45 @@ update_avahi() { | grep -v '^169\.254\.' \ | head -n1) + local new_content="" + if [ -n "$dhcp_ip" ]; then + new_content="$dhcp_ip $hostname $hostname.local" + fi + + local current_content + current_content=$(cat /etc/avahi/hosts 2>/dev/null || echo "") + + if [ "$new_content" = "$current_content" ]; then + logger -t nm-link-local "Avahi: hosts unchanged, skipping reload" + return + fi + if [ -n "$dhcp_ip" ]; then mkdir -p /etc/avahi - echo "$dhcp_ip $hostname $hostname.local" > /etc/avahi/hosts + echo "$new_content" > /etc/avahi/hosts logger -t nm-link-local "Avahi: pinned $hostname -> $dhcp_ip" else rm -f /etc/avahi/hosts logger -t nm-link-local "Avahi: removed hosts pin, using all addresses" fi - systemctl restart avahi-daemon 2>/dev/null + systemctl reload avahi-daemon 2>/dev/null || systemctl restart avahi-daemon 2>/dev/null } case "$ACTION" in - up|dhcp4-change) + up) + # On 'up' the interface may still carry a stale DHCP address from the previous + # session (NM hasn't cleaned it up yet). Reading ip-addr here is unreliable. + # Always re-enable link-local as a clean slate; let dhcp4-change suppress it + # later if a real DHCP lease is obtained. + logger -t nm-link-local "[$INTERFACE] Up — ensuring link-local active (clean slate)" + (sleep 2 && nmcli device modify "$INTERFACE" ipv4.link-local enabled 2>/dev/null \ + && logger -t nm-link-local "[$INTERFACE] Link-local explicitly enabled on up") & + update_avahi + ;; + + dhcp4-change) + # dhcp4-change fires only when DHCP actually succeeds (new/renewed lease). + # At this point the DHCP IP is reliably present — safe to read and suppress link-local. DHCP_IP=$(ip -4 addr show "$INTERFACE" 2>/dev/null \ | grep -oP '(?<=inet\s)\d+(\.\d+){3}' \ | grep -v '^127\.' \ @@ -60,24 +86,19 @@ case "$ACTION" in | head -n1) if [ -n "$DHCP_IP" ]; then - logger -t nm-link-local "[$INTERFACE] DHCP $DHCP_IP detected — suppressing link-local (session only)" - # Use device modify (not connection modify) so the persistent profile keeps - # ipv4.link-local=enabled. This ensures direct-connect plug-ins always activate. + logger -t nm-link-local "[$INTERFACE] DHCP $DHCP_IP confirmed — suppressing link-local (session only)" # Run in background after a delay — nmcli blocks on NM, which is waiting for # this dispatcher to return, causing a deadlock if called synchronously. (sleep 2 && nmcli device modify "$INTERFACE" ipv4.link-local disabled 2>/dev/null \ && logger -t nm-link-local "[$INTERFACE] Link-local suppressed for current session") & - else - logger -t nm-link-local "[$INTERFACE] No DHCP on $INTERFACE — keeping link-local active" fi update_avahi ;; down) - # Profile always has ipv4.link-local=enabled so no action needed here. - # The suppression from device modify was session-only and is gone when the - # connection goes down. - logger -t nm-link-local "[$INTERFACE] Down — link-local will be active on next connect" + # NOTE: a carrier-change does NOT fully reset session-level 'device modify' state. + # The re-enable is therefore handled in the 'up' handler when no DHCP is detected. + logger -t nm-link-local "[$INTERFACE] Down — link-local will be re-enabled on next up without DHCP" update_avahi ;; esac diff --git a/src/service/update_and_run_server_and_frontend.sh b/src/service/update_and_run_server_and_frontend.sh index f6b8159..f3cbe46 100755 --- a/src/service/update_and_run_server_and_frontend.sh +++ b/src/service/update_and_run_server_and_frontend.sh @@ -8,8 +8,17 @@ set -e # Enable link-local for all wired ethernet connections while IFS=: read -r name type; do if [[ "$type" == *"ethernet"* ]]; then - echo "Enabling IPv4 link-local for connection: $name" + echo "Configuring connection: $name" + # link-local: always enabled so direct-connect (no DHCP) works immediately sudo nmcli connection modify "$name" ipv4.link-local enabled 2>/dev/null || echo "Failed to modify $name" + # may-fail=yes: do NOT tear down the connection when DHCP times out. + # Without this, NM declares ip-config-unavailable after the 45s DHCP timeout + # and enters a reconnect loop that causes ~1.5 min outages every ~45 seconds. + sudo nmcli connection modify "$name" ipv4.may-fail yes 2>/dev/null || echo "Failed to set may-fail on $name" + # Infinite DHCP timeout: NM keeps retrying DHCP in the background but never + # declares ip-config-unavailable. This prevents the 45s reconnect loop that + # kills the link-local address in direct-connect (no DHCP server) scenarios. + sudo nmcli connection modify "$name" ipv4.dhcp-timeout infinity 2>/dev/null || echo "Failed to set dhcp-timeout on $name" sudo nmcli connection up "$name" 2>/dev/null || echo "Failed to bring up $name" fi done < <(nmcli -t -f NAME,TYPE connection show)