support for rime arcana model

2025-04-26 15:59:25 -07:00
parent a995cf81b6
commit b25f3b2ed2
2 changed files with 13 additions and 1 deletions
--- a/examples/foundational/07q-interruptible-rime-http.py
+++ b/examples/foundational/07q-interruptible-rime-http.py
@@ -44,7 +44,8 @@ async def run_bot(webrtc_connection: SmallWebRTCConnection, _: argparse.Namespac

        tts = RimeHttpTTSService(
            api_key=os.getenv("RIME_API_KEY", ""),
-            voice_id="rex",
+            voice_id="luna",
+            model="arcana",
            aiohttp_session=session,
        )

--- a/src/pipecat/services/rime/tts.py
+++ b/src/pipecat/services/rime/tts.py
@@ -400,6 +400,13 @@ class RimeHttpTTSService(TTSService):
        payload["modelId"] = self._model_name
        payload["samplingRate"] = self.sample_rate

+        # Arcana does not support PCM audio
+        if payload["modelId"] == "arcana":
+            headers["Accept"] = "audio/wav"
+            need_to_strip_wav_header = True
+        else:
+            need_to_strip_wav_header = False
+
        try:
            await self.start_ttfb_metrics()

@@ -420,6 +427,10 @@ class RimeHttpTTSService(TTSService):
                CHUNK_SIZE = 1024

                async for chunk in response.content.iter_chunked(CHUNK_SIZE):
+                    if need_to_strip_wav_header and chunk.startswith(b"RIFF"):
+                        chunk = chunk[44:]
+                        need_to_strip_wav_header = False
+
                    if len(chunk) > 0:
                        await self.stop_ttfb_metrics()
                        frame = TTSAudioRawFrame(chunk, self.sample_rate, 1)