Cleanup PcmData constructors and populate participant in events (#192)

tbarbugli · web-flow · commit 60d59d8cc650 · 2025-11-12T14:35:17.000+01:00
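* clean up/simplify PcmData methods: rename from_data() to from_numpy() (numpy arrays only; bytes go through from_bytes()) and factor the chunking logic shared by the sync and async from_response() iterators into private helpers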

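* attach the participant to the emitted PcmData (pcm.participant) instead of passing it as a separate argument; "audio" event handlers now receive only pcm_data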
diff --git a/getstream/video/rtc/pc.py b/getstream/video/rtc/pc.py
@@ -155,10 +155,14 @@ async def on_track(track: aiortc.mediastreams.MediaStreamTrack):
             self.track_map[track.id] = (relay, track)
 
             if track.kind == "audio":
-                # Add a new subscriber for AudioTrackHandler
-                handler = AudioTrackHandler(
-                    relay.subscribe(track), lambda pcm: self.emit("audio", pcm, user)
-                )
+                from getstream.video.rtc import PcmData
+
+                # Add a new subscriber for AudioTrackHandler and attach the participant to the pcm object
+                def _emit_pcm(pcm: PcmData):
+                    pcm.participant = user
+                    self.emit("audio", pcm)
+
+                handler = AudioTrackHandler(relay.subscribe(track), _emit_pcm)
                 asyncio.create_task(handler.start())
 
             self.emit("track_added", relay.subscribe(track), user)
diff --git a/getstream/video/rtc/peer_connection.py b/getstream/video/rtc/peer_connection.py
@@ -43,8 +43,8 @@ async def setup_subscriber(self):
             )
 
             @self.subscriber_pc.on("audio")
-            async def on_audio(pcm_data, user):
-                self.connection_manager.emit("audio", pcm_data, user)
+            async def on_audio(pcm_data):
+                self.connection_manager.emit("audio", pcm_data)
 
             @self.subscriber_pc.on("track_added")
             async def on_track_added(track, user):
diff --git a/getstream/video/rtc/track_util.py b/getstream/video/rtc/track_util.py
@@ -161,7 +161,7 @@ def __init__(
                     f"Dtype mismatch: format='{format}' requires samples with dtype={expected_dtype_name}, "
                     f"but got dtype={actual_dtype_name}. "
                     f"To fix: use .to_float32() for f32 format, or ensure samples match the declared format. "
-                    f"For automatic conversion, use PcmData.from_data() instead."
+                    f"For automatic conversion, use PcmData.from_numpy() instead."
                 )
 
         self.samples: NDArray = samples
@@ -358,77 +358,75 @@ def from_bytes(
         )
 
     @classmethod
-    def from_data(
+    def from_numpy(
         cls,
-        data: Union[bytes, bytearray, memoryview, NDArray],
+        array: NDArray,
         sample_rate: int = 16000,
         format: AudioFormatType = AudioFormat.S16,
         channels: int = 1,
     ) -> "PcmData":
-        """Build from bytes or numpy arrays.
+        """Build from numpy arrays with automatic dtype/shape conversion.
 
         Args:
-            data: Input audio data (bytes or numpy array)
+            array: Input audio data as numpy array
             sample_rate: Sample rate in Hz (default: 16000)
             format: Audio format (default: AudioFormat.S16)
             channels: Number of channels (default: 1 for mono)
 
         Example:
         >>> import numpy as np
-        >>> PcmData.from_data(np.array([1, 2], np.int16), sample_rate=16000, format=AudioFormat.S16, channels=1).channels
+        >>> PcmData.from_numpy(np.array([1, 2], np.int16), sample_rate=16000, format=AudioFormat.S16, channels=1).channels
         1
         """
         # Validate format
         AudioFormat.validate(format)
-        if isinstance(data, (bytes, bytearray, memoryview)):
-            return cls.from_bytes(
-                bytes(data), sample_rate=sample_rate, format=format, channels=channels
-            )
 
-        if isinstance(data, np.ndarray):
-            arr = data
-            # Ensure dtype aligns with format
-            if format == "s16" and arr.dtype != np.int16:
-                arr = arr.astype(np.int16)
-            elif format == "f32" and arr.dtype != np.float32:
-                arr = arr.astype(np.float32)
+        if not isinstance(array, np.ndarray):
+            raise TypeError(
+                f"from_numpy() expects a numpy array, got {type(array).__name__}. "
+                f"Use from_bytes() for bytes or from_response() for API responses."
+            )
 
-            # Normalize shape to (channels, samples) for multi-channel
-            if arr.ndim == 2:
-                if arr.shape[0] == channels:
-                    samples_arr = arr
-                elif arr.shape[1] == channels:
-                    samples_arr = arr.T
-                else:
-                    # Assume first dimension is channels if ambiguous
-                    samples_arr = arr
-            elif arr.ndim == 1:
-                if channels > 1:
-                    try:
-                        frames = arr.reshape(-1, channels)
-                        samples_arr = frames.T
-                    except Exception:
-                        logger.warning(
-                            f"Could not reshape 1D array to {channels} channels; keeping mono"
-                        )
-                        channels = 1
-                        samples_arr = arr
-                else:
+        arr = array
+        # Ensure dtype aligns with format
+        if format == "s16" and arr.dtype != np.int16:
+            arr = arr.astype(np.int16)
+        elif format == "f32" and arr.dtype != np.float32:
+            arr = arr.astype(np.float32)
+
+        # Normalize shape to (channels, samples) for multi-channel
+        if arr.ndim == 2:
+            if arr.shape[0] == channels:
+                samples_arr = arr
+            elif arr.shape[1] == channels:
+                samples_arr = arr.T
+            else:
+                # Assume first dimension is channels if ambiguous
+                samples_arr = arr
+        elif arr.ndim == 1:
+            if channels > 1:
+                try:
+                    frames = arr.reshape(-1, channels)
+                    samples_arr = frames.T
+                except Exception:
+                    logger.warning(
+                        f"Could not reshape 1D array to {channels} channels; keeping mono"
+                    )
+                    channels = 1
                     samples_arr = arr
             else:
-                # Fallback
-                samples_arr = arr.reshape(-1)
-                channels = 1
-
-            return cls(
-                samples=samples_arr,
-                sample_rate=sample_rate,
-                format=format,
-                channels=channels,
-            )
+                samples_arr = arr
+        else:
+            # Fallback
+            samples_arr = arr.reshape(-1)
+            channels = 1
 
-        # Unsupported type
-        raise TypeError(f"Unsupported data type for PcmData: {type(data)}")
+        return cls(
+            samples=samples_arr,
+            sample_rate=sample_rate,
+            format=format,
+            channels=channels,
+        )
 
     @classmethod
     def from_av_frame(cls, frame: "av.AudioFrame") -> "PcmData":
@@ -885,6 +883,69 @@ def clear(self) -> None:
 
         self.samples = np.array([], dtype=dtype)
 
+    @staticmethod
+    def _calculate_sample_width(format: AudioFormatType) -> int:
+        """Calculate bytes per sample for a given format."""
+        return 2 if format == "s16" else 4 if format == "f32" else 2
+
+    @classmethod
+    def _process_iterator_chunk(
+        cls,
+        buf: bytearray,
+        frame_width: int,
+        sample_rate: int,
+        channels: int,
+        format: AudioFormatType,
+    ) -> tuple[Optional["PcmData"], bytearray]:
+        """
+        Process buffered audio data and return aligned chunk.
+
+        Returns:
+            Tuple of (PcmData chunk or None, remaining buffer)
+        """
+        aligned = (len(buf) // frame_width) * frame_width
+        if aligned:
+            chunk = bytes(buf[:aligned])
+            remaining = buf[aligned:]
+            pcm = cls.from_bytes(
+                chunk,
+                sample_rate=sample_rate,
+                channels=channels,
+                format=format,
+            )
+            return pcm, bytearray(remaining)
+        return None, buf
+
+    @classmethod
+    def _finalize_iterator_buffer(
+        cls,
+        buf: bytearray,
+        frame_width: int,
+        sample_rate: int,
+        channels: int,
+        format: AudioFormatType,
+    ) -> Optional["PcmData"]:
+        """
+        Process remaining buffer at end of iteration with padding if needed.
+
+        Returns:
+            Final PcmData chunk or None if buffer is empty
+        """
+        if not buf:
+            return None
+
+        # Pad to frame boundary
+        pad_len = (-len(buf)) % frame_width
+        if pad_len:
+            buf.extend(b"\x00" * pad_len)
+
+        return cls.from_bytes(
+            bytes(buf),
+            sample_rate=sample_rate,
+            channels=channels,
+            format=format,
+        )
+
     @classmethod
     def from_response(
         cls,
@@ -926,38 +987,32 @@ def from_response(
         if hasattr(response, "__aiter__"):
 
             async def _agen():
-                width = 2 if format == "s16" else 4 if format == "f32" else 2
+                width = cls._calculate_sample_width(format)
                 frame_width = width * max(1, channels)
                 buf = bytearray()
+
                 async for item in response:
                     if isinstance(item, PcmData):
                         yield item
                         continue
+
                     data = getattr(item, "data", item)
                     if not isinstance(data, (bytes, bytearray, memoryview)):
                         raise TypeError("Async iterator yielded unsupported item type")
+
                     buf.extend(bytes(data))
-                    aligned = (len(buf) // frame_width) * frame_width
-                    if aligned:
-                        chunk = bytes(buf[:aligned])
-                        del buf[:aligned]
-                        yield cls.from_bytes(
-                            chunk,
-                            sample_rate=sample_rate,
-                            channels=channels,
-                            format=format,
-                        )
-                # pad remainder, if any
-                if buf:
-                    pad_len = (-len(buf)) % frame_width
-                    if pad_len:
-                        buf.extend(b"\x00" * pad_len)
-                    yield cls.from_bytes(
-                        bytes(buf),
-                        sample_rate=sample_rate,
-                        channels=channels,
-                        format=format,
+                    chunk, buf = cls._process_iterator_chunk(
+                        buf, frame_width, sample_rate, channels, format
                     )
+                    if chunk:
+                        yield chunk
+
+                # Handle remainder
+                final_chunk = cls._finalize_iterator_buffer(
+                    buf, frame_width, sample_rate, channels, format
+                )
+                if final_chunk:
+                    yield final_chunk
 
             return _agen()
 
@@ -967,37 +1022,32 @@ async def _agen():
         ):
 
             def _gen():
-                width = 2 if format == "s16" else 4 if format == "f32" else 2
+                width = cls._calculate_sample_width(format)
                 frame_width = width * max(1, channels)
                 buf = bytearray()
+
                 for item in response:
                     if isinstance(item, PcmData):
                         yield item
                         continue
+
                     data = getattr(item, "data", item)
                     if not isinstance(data, (bytes, bytearray, memoryview)):
                         raise TypeError("Iterator yielded unsupported item type")
+
                     buf.extend(bytes(data))
-                    aligned = (len(buf) // frame_width) * frame_width
-                    if aligned:
-                        chunk = bytes(buf[:aligned])
-                        del buf[:aligned]
-                        yield cls.from_bytes(
-                            chunk,
-                            sample_rate=sample_rate,
-                            channels=channels,
-                            format=format,
-                        )
-                if buf:
-                    pad_len = (-len(buf)) % frame_width
-                    if pad_len:
-                        buf.extend(b"\x00" * pad_len)
-                    yield cls.from_bytes(
-                        bytes(buf),
-                        sample_rate=sample_rate,
-                        channels=channels,
-                        format=format,
+                    chunk, buf = cls._process_iterator_chunk(
+                        buf, frame_width, sample_rate, channels, format
                     )
+                    if chunk:
+                        yield chunk
+
+                # Handle remainder
+                final_chunk = cls._finalize_iterator_buffer(
+                    buf, frame_width, sample_rate, channels, format
+                )
+                if final_chunk:
+                    yield final_chunk
 
             return _gen()
 
diff --git a/tests/rtc/test_pcm_data.py b/tests/rtc/test_pcm_data.py

Original file line number	Diff line number	Diff line change
`@@ -43,8 +43,8 @@ async def setup_subscriber(self):`
`43`	`43`	`)`
`44`	`44`
`45`	`45`	`@self.subscriber_pc.on("audio")`
`46`		`- async def on_audio(pcm_data, user):`
`47`		`- self.connection_manager.emit("audio", pcm_data, user)`
	`46`	`+ async def on_audio(pcm_data):`
	`47`	`+ self.connection_manager.emit("audio", pcm_data)`
`48`	`48`
`49`	`49`	`@self.subscriber_pc.on("track_added")`
`50`	`50`	`async def on_track_added(track, user):`