luxonis · Serafadam · Mar 7, 2024 · Mar 4, 2024 · Mar 4, 2024 · Mar 7, 2024
diff --git a/Dockerfile b/Dockerfile
@@ -26,7 +26,7 @@ RUN apt-get update && apt-get -y install --no-install-recommends \
     libsndfile1-dev \
     libsndfile1
 
-RUN pip3 install openai
+RUN pip3 install openai ffmpeg-python
 
 ENV WS=/ws
 RUN mkdir -p $WS/src

diff --git a/rae_hw/src/peripherals/speakers.cpp b/rae_hw/src/peripherals/speakers.cpp
@@ -133,7 +133,7 @@ void SpeakersNode::play_wav(const char* wav_file) {
     int32_t* buffer_wav = new int32_t[BUFFER_SIZE * sfinfo.channels];  // Use int32_t for 32-bit format
     sf_count_t readCount;
 
-    const float gain = 64.0f;  // Adjust this factor for desired gain
+    const float gain = 16.0f;  // Adjust this factor for desired gain
 
     while((readCount = sf_readf_int(file, buffer_wav, BUFFER_SIZE)) > 0) {
         // Apply gain to the samples

diff --git a/rae_sdk/rae_sdk/robot/audio.py b/rae_sdk/rae_sdk/robot/audio.py
@@ -2,7 +2,8 @@
 import random
 import logging as log
 from ament_index_python import get_package_share_directory
-
+import base64
+import ffmpeg
 from rae_msgs.srv import PlayAudio
 
 
@@ -38,6 +39,31 @@ def play_audio_file(self, audio_file_path):
         req.file_location = audio_file_path
         res = self._ros_interface.call_async_srv('/play_audio', req)
         return res
+
+    def save_recorded_sound(self, audio_data, output_file="/app/mic_recording.wav"):
+        """
+        Decode Base64 WebM audio, convert it to WAV via ffmpeg, and save it to a file.
+
+        Attributes
+        ----------
+            audio_data (str): Base64-encoded WebM audio data.
+            output_file (str, optional): Path to save the WAV file. Defaults to "/app/mic_recording.wav".
+
+
+        """
+        # Decode Base64 data
+        binary_data = base64.b64decode(audio_data)
+
+        # Convert WebM to WAV using ffmpeg
+        output, _ = (
+            ffmpeg.input('pipe:', format='webm')
+            .output('pipe:', format='wav')
+            .run(input=binary_data, capture_stdout=True, capture_stderr=True)
+        )
+
+        # Write the output to the specified WAV file
+        with open(output_file, 'wb') as wave_file:
+            wave_file.write(output)
 
     def honk(self):
         horn_path = os.path.join(self._assets_path, 'sfx', 'horn.mp3')