134ms constant delay, no build up, seems to be no glitches, bang bang control.

2026-03-30 14:45:25 +02:00
parent cdfecaf5eb
commit cf69ad2957
1 changed files with 65 additions and 126 deletions
@@ -140,7 +140,7 @@ class AlsaArecordAudioInput(audio_io.AudioInput):


 class PyAlsaAudioInput(audio_io.ThreadedAudioInput):
-    """PyALSA audio input with callback thread and ring buffer - supports mono/stereo."""
+    """PyALSA audio input with non-blocking reads - supports mono/stereo."""

    def __init__(self, device, pcm_format: audio_io.PcmFormat):
        super().__init__()
@@ -149,28 +149,18 @@ class PyAlsaAudioInput(audio_io.ThreadedAudioInput):
            self._device = 'default' if self._device == '0' else f'hw:{self._device}'
        self._pcm_format = pcm_format
        self._pcm = None
-        self._ring_buffer = deque()
-        self._ring_lock = threading.Lock()
-        self._running = False
-        self._callback_thread = None
        self._actual_channels = None
        self._periodsize = None
-        self._buffer_log_last_ts = time.monotonic()
-        self._buffer_log_max_last_sec = 0
+        self._hw_channels = None
+        self._first_read = True

    def _open(self) -> audio_io.PcmFormat:
-        # ========== LATENCY CONFIGURATION ==========
-        # Adjust these parameters to tune latency vs stability
-        ALSA_PERIODSIZE = 96      # Samples per ALSA read (240@48kHz = 5ms, 120 = 2.5ms, 96 = 2ms)
-        ALSA_PERIODS = 2           # Number of periods in ALSA buffer (lower = less latency, more risk of underrun)
-        # Ring buffer: keep only 3 periods max to minimize latency (safety margin only)
-        # ===========================================
+        ALSA_PERIODSIZE = 240
+        ALSA_PERIODS = 4
        
        requested_rate = int(self._pcm_format.sample_rate)
        requested_channels = int(self._pcm_format.channels)
        self._periodsize = ALSA_PERIODSIZE
-        # Max ring buffer = 3 periods worth of data (tight coupling, minimal latency)
-        self._max_buffer_bytes = ALSA_PERIODSIZE * 60 * 2 * requested_channels
        
        self._pcm = alsaaudio.PCM(
            type=alsaaudio.PCM_CAPTURE,
@@ -184,19 +174,16 @@ class PyAlsaAudioInput(audio_io.ThreadedAudioInput):
        actual_rate = self._pcm.setrate(requested_rate)
        self._pcm.setperiodsize(ALSA_PERIODSIZE)
        
-        ring_buf_samples = self._max_buffer_bytes // (2 * requested_channels)
-        ring_buf_ms = (ring_buf_samples / actual_rate) * 1000
-        logging.info("PyALSA: device=%s rate=%d ch=%d periodsize=%d (%.1fms) periods=%d ring_buf=%d samples (%.1fms)", 
+        logging.info("PyALSA: device=%s rate=%d ch=%d periodsize=%d (%.1fms) periods=%d mode=NONBLOCK", 
                     self._device, actual_rate, requested_channels, ALSA_PERIODSIZE, 
-                     (ALSA_PERIODSIZE / actual_rate) * 1000, ALSA_PERIODS, ring_buf_samples, ring_buf_ms)
+                     (ALSA_PERIODSIZE / actual_rate) * 1000, ALSA_PERIODS)
        
        if actual_rate != requested_rate:
            logging.warning("PyALSA: Sample rate mismatch! requested=%d actual=%d", requested_rate, actual_rate)
        
        self._actual_channels = requested_channels
-        self._running = True
-        self._callback_thread = threading.Thread(target=self._capture_loop, daemon=True)
-        self._callback_thread.start()
+
+        self._bang_bang = 0
        
        return audio_io.PcmFormat(
            audio_io.PcmFormat.Endianness.LITTLE,
@@ -205,128 +192,80 @@ class PyAlsaAudioInput(audio_io.ThreadedAudioInput):
            requested_channels,
        )

-    def _capture_loop(self):
-        first_read = True
-        hw_channels = None
-        while self._running:
+    def _read(self, frame_size: int) -> bytes:
+        bytes_needed = frame_size * 2 * self._actual_channels
+        result = b''
+        
+        try:
+            length, data = self._pcm.read_sw(frame_size + self._bang_bang)
+            avail = self._pcm.avail()
+            self._bang_bang = 1 if avail > 50 else 0
+            logging.info("PyALSA: read length=%d, data length=%d, avail=%d, bang_bang=%d", length, len(data), avail, self._bang_bang)
+
+            if length > 0:
+                if self._first_read:
+                    expected_mono = self._periodsize * 2
+                    expected_stereo = self._periodsize * 2 * 2
+                    # self._hw_channels = 2 if len(data) == expected_stereo else 1
+                    self._hw_channels = 2  # TODO fix stereo detection, on first read might detect 0 data
+                    logging.info("PyALSA first read: bytes=%d detected_hw_channels=%d requested_channels=%d", 
+                                len(data), self._hw_channels, self._actual_channels)
+                    self._first_read = False
+                
+                if self._hw_channels == 2 and self._actual_channels == 1:
+                    pcm_stereo = np.frombuffer(data, dtype=np.int16)
+                    pcm_mono = pcm_stereo[::2]
+                    data = pcm_mono.tobytes()
+                
+                result += data
+            else:
+                logging.info("PyALSA: No data read from ALSA")
+        except alsaaudio.ALSAAudioError as e:
+            logging.info("PyALSA: ALSA read error: %s", e)
+
+        
+        logging.info("PyALSA: result length=%d, frame_size=%d", len(result), frame_size)
+
+        if len(result) < bytes_needed:
+            result += b'\x00' * (bytes_needed - len(result))
+            
+        return result[:bytes_needed]
+
+    def _read2(self, frame_size: int) -> bytes:
+        bytes_needed = frame_size * 2 * self._actual_channels
+        result = b''
+        
+        while len(result) < bytes_needed:
            try:
                length, data = self._pcm.read()
                if length > 0:
-                    if first_read:
+                    if self._first_read:
                        expected_mono = self._periodsize * 2
                        expected_stereo = self._periodsize * 2 * 2
-                        hw_channels = 2 if len(data) == expected_stereo else 1
-                        logging.info("PyALSA first capture: bytes=%d detected_hw_channels=%d requested_channels=%d", 
-                                    len(data), hw_channels, self._actual_channels)
-                        first_read = False
+                        self._hw_channels = 2 if len(data) == expected_stereo else 1
+                        logging.info("PyALSA first read: bytes=%d detected_hw_channels=%d requested_channels=%d", 
+                                    len(data), self._hw_channels, self._actual_channels)
+                        self._first_read = False
                    
-                    # Convert stereo hardware to mono if needed
-                    if hw_channels == 2 and self._actual_channels == 1:
+                    if self._hw_channels == 2 and self._actual_channels == 1:
                        pcm_stereo = np.frombuffer(data, dtype=np.int16)
                        pcm_mono = pcm_stereo[::2]
                        data = pcm_mono.tobytes()
                    
-                    with self._ring_lock:
-                        self._ring_buffer.append(data)
-                        # total_bytes = sum(len(chunk) for chunk in self._ring_buffer)
-                        # # logging.info("Ringbuffer: bytes=%d", total_bytes) 
-                        # while total_bytes > self._max_buffer_bytes:
-                        #     self._ring_buffer.popleft()
-                        #     logging.error("Ringbuffer: OVERFLOW") 
-                        #     total_bytes = sum(len(chunk) for chunk in self._ring_buffer)
-            except:
-                if self._running:
+                    result += data
+                else:
                    break
-
-    # def _read(self, frame_size: int) -> bytes:
-    #     bytes_needed = frame_size * 2
-    #     result = b''
-
-    #     buffer_not_empty = True
-    #     while (len(result) < bytes_needed) and buffer_not_empty:
-    #         with self._ring_lock:
-    #             buffer_size = sum(len(chunk) for chunk in self._ring_buffer)
-    #             self._buffer_log_max_last_sec = max(self._buffer_log_max_last_sec, buffer_size)
-    #             now = time.monotonic()
-    #             if now - self._buffer_log_last_ts >= 1.0:
-    #                 logging.info(
-    #                     "Buffer size (bytes): current=%d max_last_sec=%d",
-    #                     buffer_size,
-    #                     self._buffer_log_max_last_sec,
-    #                 )
-    #                 self._buffer_log_last_ts = now
-    #                 self._buffer_log_max_last_sec = 0
-    #             if self._ring_buffer and buffer_size > bytes_needed :
-    #                 chunk = self._ring_buffer.popleft()
-    #                 needed = bytes_needed - len(result)
-    #                 if len(chunk) <= needed:
-    #                     result += chunk
-    #                 else:
-    #                     result += chunk[:needed]
-    #                     self._ring_buffer.appendleft(chunk[needed:])
-    #             else:
-    #                 # Ring buffer empty - release lock and wait a bit
-    #                 pass
-            
-    #         if len(result) < bytes_needed:
-    #             # Don't busy-wait - sleep briefly to let capture thread fill buffer
-    #             time.sleep(0.001)  # 0.1ms
+            except alsaaudio.ALSAAudioError:
+                break
        
-    #     return result
-
-    def _read(self, frame_size: int) -> bytes:
-        bytes_needed = frame_size * 2
-        result = b''
-
-        if self._ring_buffer:
-            buffer_size = sum(len(chunk) for chunk in self._ring_buffer)
-        else:
-            buffer_size = 0
-        buffer_not_empty = (buffer_size != 0)
-        with self._ring_lock:
-            while (len(result) < bytes_needed) and buffer_not_empty:
-                chunk = self._ring_buffer.popleft()
-                needed = bytes_needed - len(result)
-                if len(chunk) <= needed:
-                    result += chunk
-                else:
-                    result += chunk[:needed]
-                    self._ring_buffer.appendleft(chunk[needed:])
-                if self._ring_buffer:
-                    buffer_size = sum(len(chunk) for chunk in self._ring_buffer)
-                    self._buffer_log_max_last_sec = max(self._buffer_log_max_last_sec, buffer_size)
-                    now = time.monotonic()
-                    if now - self._buffer_log_last_ts >= 1.0:
-                        logging.info(
-                            "Buffer size (bytes): current=%d max_last_sec=%d",
-                            buffer_size,
-                            self._buffer_log_max_last_sec,
-                        )
-                        self._buffer_log_last_ts = now
-                        self._buffer_log_max_last_sec = 0
-                else:
-                    buffer_size = 0
-                buffer_not_empty = (buffer_size != 0)
-        #append to bytesneeded
        if len(result) < bytes_needed:
            result += b'\x00' * (bytes_needed - len(result))
            
-        return result
+        return result[:bytes_needed]

-    # def _read(self, frame_size: int) -> bytes:
-    #     bytes_needed = frame_size * 2
-    #     result = b''
-    #     # Generate 500Hz sine wave
-    #     samples = []
-    #     for i in range(frame_size):
-    #         sample = int(np.sin(2 * np.pi * 500 * i / 48000) * 32767)
-    #         samples.append(sample)
-    #     return struct.pack('h' * len(samples), *samples)
+  

    def _close(self) -> None:
-        self._running = False
-        if self._callback_thread:
-            self._callback_thread.join(timeout=1.0)
        if self._pcm:
            self._pcm.close()
            self._pcm = None