livekit · phpmaple · Oct 18, 2024 · Oct 18, 2024
diff --git a/.changeset/silly-dryers-admire.md b/.changeset/silly-dryers-admire.md
@@ -0,0 +1,5 @@
+---
+"livekit-agents": patch
+---
+
+Add audio output post-processing to the multimodal agent via `set_audio_processor`
diff --git a/livekit-agents/livekit/agents/multimodal/multimodal_agent.py b/livekit-agents/livekit/agents/multimodal/multimodal_agent.py
@@ -2,7 +2,7 @@
 
 import asyncio
 from dataclasses import dataclass
-from typing import Callable, Literal, Protocol
+from typing import AsyncIterable,Awaitable, Callable, Literal, Protocol
 
 import aiohttp
 from livekit import rtc
@@ -92,6 +92,10 @@ def __init__(
         self._update_state_task: asyncio.Task | None = None
         self._http_session: aiohttp.ClientSession | None = None
 
+        # optional post-processor for the audio output stream; None means no post-processing
+        self._audio_processor: Callable[[AsyncIterable[bytes]], Awaitable[AsyncIterable[bytes]]] | None = None
+
+
     @property
     def vad(self) -> vad.VAD | None:
         return self._vad
@@ -104,6 +108,12 @@ def fnc_ctx(self) -> llm.FunctionContext | None:
     def fnc_ctx(self, value: llm.FunctionContext | None) -> None:
         self._session.fnc_ctx = value
 
+    def set_audio_processor(self, processor: Callable[[AsyncIterable[bytes]], Awaitable[AsyncIterable[bytes]]]):
+        """
+        Set the callable applied to each content message's audio stream (see `_on_content_added`).
+        """
+        self._audio_processor = processor
+
     def start(
         self, room: rtc.Room, participant: rtc.RemoteParticipant | str | None = None
     ) -> None:
@@ -145,6 +155,10 @@ def _on_content_added(message: realtime.RealtimeContent):
                 hyphenate_word=self._opts.transcription.hyphenate_word,
             )
 
+            audio_stream = message.audio_stream
+            if self._audio_processor:
+                audio_stream = self._audio_processor(audio_stream)
+
             self._playing_handle = self._agent_playout.play(
                 item_id=message.item_id,
                 content_index=message.content_index,