Spaces:

pollen-robotics
/

reachy_mini_conversation_app

Running

Remi committed on Nov 17

Commit

b7e5088

unverified ·

2 Parent(s): 601cd23 ba448b6

Merge pull request #102 from pollen-robotics/fix/resample-overhead

Files changed (1) hide show

src/reachy_mini_conversation_app/console.py CHANGED Viewed

@@ -8,8 +8,8 @@ import asyncio
 import logging
 from typing import List
-import librosa
 from fastrtc import AdditionalOutputs, audio_to_int16, audio_to_float32
 from reachy_mini import ReachyMini
 from reachy_mini_conversation_app.openai_realtime import OpenaiRealtimeHandler
@@ -30,6 +30,11 @@ class LocalStream:
         # Allow the handler to flush the player queue when appropriate.
         self.handler._clear_queue = self.clear_audio_queue
     def launch(self) -> None:
         """Start the recorder/player and run the async processing loops."""
         self._stop_event.clear()
@@ -110,7 +115,7 @@ class LocalStream:
                 audio_frame_float = audio_to_float32(audio_frame.squeeze())
                 if input_sample_rate != device_sample_rate:
-                    audio_frame_float = librosa.resample(
                         audio_frame_float,
                         orig_sr=input_sample_rate,
                         target_sr=device_sample_rate,

 import logging
 from typing import List
 from fastrtc import AdditionalOutputs, audio_to_int16, audio_to_float32
+from librosa import resample
 from reachy_mini import ReachyMini
 from reachy_mini_conversation_app.openai_realtime import OpenaiRealtimeHandler
         # Allow the handler to flush the player queue when appropriate.
         self.handler._clear_queue = self.clear_audio_queue
+        # Hack to avoid the first lengthy call to resample at runtime.
+        # This is likely caused by cache initialization overhead.
+        import numpy as np
+        resample(np.array([0.0]), orig_sr=1, target_sr=1)
     def launch(self) -> None:
         """Start the recorder/player and run the async processing loops."""
         self._stop_event.clear()
                 audio_frame_float = audio_to_float32(audio_frame.squeeze())
                 if input_sample_rate != device_sample_rate:
+                    audio_frame_float = resample(
                         audio_frame_float,
                         orig_sr=input_sample_rate,
                         target_sr=device_sample_rate,