livekit · chenosaurus · Sep 8, 2025 · Sep 9, 2025 · Sep 9, 2025 · Sep 10, 2025
diff --git a/examples/local_audio/full_duplex.py b/examples/local_audio/full_duplex.py
@@ -0,0 +1,147 @@
+import os
+import asyncio
+import logging
+from dotenv import load_dotenv, find_dotenv
+
+from livekit import api, rtc
+
+
+async def main() -> None:
+    """Publish the local microphone and play the mixed remote audio until interrupted.
+
+    Raises RuntimeError if LIVEKIT_URL, LIVEKIT_API_KEY or LIVEKIT_API_SECRET is unset.
+    """
+    logging.basicConfig(level=logging.INFO)
+
+    # Load environment variables from a .env file if present
+    load_dotenv(find_dotenv())
+
+    url = os.getenv("LIVEKIT_URL")
+    api_key = os.getenv("LIVEKIT_API_KEY")
+    api_secret = os.getenv("LIVEKIT_API_SECRET")
+    if not url or not api_key or not api_secret:
+        raise RuntimeError(
+            "LIVEKIT_URL and LIVEKIT_API_KEY and LIVEKIT_API_SECRET must be set in env"
+        )
+
+    room = rtc.Room()
+    devices = rtc.MediaDevices()
+
+    # Open microphone with AEC and prepare a player for remote audio feeding AEC reverse stream
+    mic = devices.open_input(enable_aec=True)
+    player = devices.open_output(apm_for_reverse=mic.apm)
+
+    # Mixer for all remote audio streams
+    mixer = rtc.AudioMixer(sample_rate=48000, num_channels=1)
+
+    # Track stream bookkeeping for cleanup
+    streams_by_pub: dict[str, rtc.AudioStream] = {}
+    streams_by_participant: dict[str, set[rtc.AudioStream]] = {}
+    background_tasks: set[asyncio.Task] = set()  # strong refs; the loop only keeps weak ones
+
+    def _spawn(coro) -> None:
+        """Schedule `coro` as a task and keep it referenced until it completes."""
+        task = asyncio.create_task(coro)
+        background_tasks.add(task)
+        task.add_done_callback(background_tasks.discard)
+
+    async def _remove_stream(
+        stream: rtc.AudioStream, participant_sid: str | None = None, pub_sid: str | None = None
+    ) -> None:
+        """Detach `stream` from the mixer, close it and drop it from the bookkeeping."""
+        try:
+            mixer.remove_stream(stream)
+        except Exception:
+            logging.debug("could not remove stream from mixer", exc_info=True)
+        try:
+            await stream.aclose()
+        except Exception:
+            logging.debug("could not close audio stream", exc_info=True)
+        if participant_sid and (owned := streams_by_participant.get(participant_sid)) is not None:
+            owned.discard(stream)
+            if not owned:
+                streams_by_participant.pop(participant_sid, None)
+        # Only drop the mapping if it still points at this stream (it may have been replaced)
+        if pub_sid is not None and streams_by_pub.get(pub_sid) is stream:
+            del streams_by_pub[pub_sid]
+
+    def on_track_subscribed(
+        track: rtc.Track,
+        publication: rtc.RemoteTrackPublication,
+        participant: rtc.RemoteParticipant,
+    ):
+        if track.kind == rtc.TrackKind.KIND_AUDIO:
+            stream = rtc.AudioStream(track, sample_rate=48000, num_channels=1)
+            streams_by_pub[publication.sid] = stream
+            streams_by_participant.setdefault(participant.sid, set()).add(stream)
+            mixer.add_stream(stream)
+            logging.info("subscribed to audio from %s", participant.identity)
+
+    def on_track_unsubscribed(
+        track: rtc.Track,
+        publication: rtc.RemoteTrackPublication,
+        participant: rtc.RemoteParticipant,
+    ):
+        stream = streams_by_pub.get(publication.sid)
+        if stream is not None:
+            _spawn(_remove_stream(stream, participant.sid, publication.sid))
+            logging.info("unsubscribed from audio of %s", participant.identity)
+
+    def on_track_unpublished(
+        publication: rtc.RemoteTrackPublication, participant: rtc.RemoteParticipant
+    ):
+        stream = streams_by_pub.get(publication.sid)
+        if stream is not None:
+            _spawn(_remove_stream(stream, participant.sid, publication.sid))
+            logging.info("track unpublished: %s from %s", publication.sid, participant.identity)
+
+    def on_participant_disconnected(participant: rtc.RemoteParticipant):
+        for stream in streams_by_participant.pop(participant.sid, set()):
+            # Best-effort discover publication sid
+            pub_sid = next((k for k, v in streams_by_pub.items() if v is stream), None)
+            _spawn(_remove_stream(stream, participant.sid, pub_sid))
+        logging.info("participant disconnected: %s", participant.identity)
+
+    room.on("track_subscribed", on_track_subscribed)
+    room.on("track_unsubscribed", on_track_unsubscribed)
+    room.on("track_unpublished", on_track_unpublished)
+    room.on("participant_disconnected", on_participant_disconnected)
+
+    token = (
+        api.AccessToken(api_key, api_secret)
+        .with_identity("local-audio")
+        .with_name("Local Audio")
+        .with_grants(api.VideoGrants(room_join=True, room="local-audio"))
+        .to_jwt()
+    )
+
+    try:
+        await room.connect(url, token)
+        logging.info("connected to room %s", room.name)
+
+        # Publish microphone
+        track = rtc.LocalAudioTrack.create_audio_track("mic", mic.source)
+        pub_opts = rtc.TrackPublishOptions()
+        pub_opts.source = rtc.TrackSource.SOURCE_MICROPHONE
+        await room.local_participant.publish_track(track, pub_opts)
+        logging.info("published local microphone")
+
+        # Start playing mixed remote audio
+        _spawn(player.play(mixer))
+
+        # Run until Ctrl+C
+        while True:
+            await asyncio.sleep(1)
+    finally:  # run every cleanup step even if an earlier one fails
+        for close in (mic.aclose, mixer.aclose, player.aclose, room.disconnect):
+            try:
+                await close()
+            except Exception:
+                logging.exception("error during shutdown")
+
+
+if __name__ == "__main__":
+    try:
+        asyncio.run(main())
+    except KeyboardInterrupt:
+        pass  # Ctrl+C: main() has already run its cleanup
diff --git a/examples/local_audio/publish_mic.py b/examples/local_audio/publish_mic.py
@@ -0,0 +1,66 @@
+import os
+import asyncio
+import logging
+from dotenv import load_dotenv, find_dotenv
+
+from livekit import api, rtc
+
+
+async def main() -> None:
+    """Publish the default microphone to the "local-audio" room until interrupted.
+
+    Raises RuntimeError if LIVEKIT_URL, LIVEKIT_API_KEY or LIVEKIT_API_SECRET is unset.
+    """
+    logging.basicConfig(level=logging.INFO)
+
+    # Load environment variables from a .env file if present
+    load_dotenv(find_dotenv())
+
+    url = os.getenv("LIVEKIT_URL")
+    api_key = os.getenv("LIVEKIT_API_KEY")
+    api_secret = os.getenv("LIVEKIT_API_SECRET")
+    if not url or not api_key or not api_secret:
+        raise RuntimeError(
+            "LIVEKIT_URL and LIVEKIT_API_KEY and LIVEKIT_API_SECRET must be set in env"
+        )
+
+    room = rtc.Room()
+
+    # Create media devices helper and open default microphone with AEC enabled
+    devices = rtc.MediaDevices()
+    mic = devices.open_input(enable_aec=True)
+
+    token = (
+        api.AccessToken(api_key, api_secret)
+        .with_identity("local-audio")
+        .with_name("Local Audio")
+        .with_grants(api.VideoGrants(room_join=True, room="local-audio"))
+        .to_jwt()
+    )
+
+    try:
+        await room.connect(url, token)
+        logging.info("connected to room %s", room.name)
+
+        track = rtc.LocalAudioTrack.create_audio_track("mic", mic.source)
+        pub_opts = rtc.TrackPublishOptions()
+        pub_opts.source = rtc.TrackSource.SOURCE_MICROPHONE
+        await room.local_participant.publish_track(track, pub_opts)
+        logging.info("published local microphone")
+
+        # Run until Ctrl+C
+        while True:
+            await asyncio.sleep(1)
+    finally:  # run every cleanup step even if an earlier one fails
+        for close in (mic.aclose, room.disconnect):
+            try:
+                await close()
+            except Exception:
+                logging.exception("error during shutdown")
+
+
+if __name__ == "__main__":
+    try:
+        asyncio.run(main())
+    except KeyboardInterrupt:
+        pass  # Ctrl+C: main() has already run its cleanup
diff --git a/livekit-rtc/livekit/rtc/__init__.py b/livekit-rtc/livekit/rtc/__init__.py
@@ -90,6 +90,13 @@
 from .audio_resampler import AudioResampler, AudioResamplerQuality
 from .audio_mixer import AudioMixer
 from .apm import AudioProcessingModule
+
+try:
+    from .media_devices import MediaDevices as MediaDevices
+
+    _HAS_MEDIA_DEVICES = True  # gates the "MediaDevices" entry in __all__ below
+except Exception:  # pragma: no cover - optional dependency (sounddevice)
+    _HAS_MEDIA_DEVICES = False  # import failed, so the name MediaDevices stays undefined here
 from .utils import combine_audio_frames
 from .rpc import RpcError, RpcInvocationData
 from .synchronizer import AVSynchronizer
@@ -179,3 +186,7 @@
     "AudioProcessingModule",
     "__version__",
 ]
+
+# Export MediaDevices only when its optional import succeeded (_HAS_MEDIA_DEVICES is True)
+if _HAS_MEDIA_DEVICES:
+    __all__.append("MediaDevices")
diff --git a/livekit-rtc/livekit/rtc/audio_mixer.py b/livekit-rtc/livekit/rtc/audio_mixer.py
@@ -184,6 +184,10 @@ async def _get_contribution(
             except StopAsyncIteration:
                 exhausted = True
                 break
+            # AudioStream may yield either AudioFrame or AudioFrameEvent; unwrap if needed
+            if hasattr(frame, "frame"):
+                frame = frame.frame  # type: ignore[assignment]
+
             new_data = np.frombuffer(frame.data.tobytes(), dtype=np.int16).reshape(
                 -1, self._num_channels
             )