ShipBit
diff --git a/‎audio_samples/Brown_Noise.wav
-6.91 MB b/‎audio_samples/Brown_Noise.wav
-6.91 MB
diff --git a/‎audio_samples/Pink_Noise.wav
-6.91 MB b/‎audio_samples/Pink_Noise.wav
-6.91 MB
diff --git a/‎audio_samples/Radio_Noise.wav
-6.86 MB b/‎audio_samples/Radio_Noise.wav
-6.86 MB
diff --git a/‎audio_samples/Radio_Static.wav
-1020 KB b/‎audio_samples/Radio_Static.wav
-1020 KB
diff --git a/‎audio_samples/Radio_Static_Beep.wav
-38.5 KB b/‎audio_samples/Radio_Static_Beep.wav
-38.5 KB
diff --git a/‎audio_samples/White_Noise.wav
-6.91 MB b/‎audio_samples/White_Noise.wav
-6.91 MB
diff --git a/‎audio_samples/low_quality_radio.wav
-518 KB b/‎audio_samples/low_quality_radio.wav
-518 KB
diff --git a/‎providers/elevenlabs.py
+9-1 b/‎providers/elevenlabs.py
+9-1
diff --git a/‎services/audio_player.py
+201-18 b/‎services/audio_player.py
+201-18
@@ -3,7 +3,7 @@
     GenerationOptions,
     PlaybackOptions,
 )
-from api.enums import ElevenlabsModel, WingmanInitializationErrorType
+from api.enums import ElevenlabsModel, SoundEffect, WingmanInitializationErrorType
 from api.interface import ElevenlabsConfig, SoundConfig, WingmanInitializationError
 from services.audio_player import AudioPlayer
 from services.secret_keeper import SecretKeeper
@@ -53,6 +53,10 @@ async def play_audio(
         def notify_playback_finished():
             audio_player.playback_events.unsubscribe("finished", playback_finished)
 
+            contains_high_end_radio = SoundEffect.HIGH_END_RADIO in sound_config.effects
+            if contains_high_end_radio:
+                audio_player.play_wav("Radio_Static_Beep.wav")
+
             if sound_config.play_beep:
                 audio_player.play_wav("beep.wav")
             elif sound_config.play_beep_apollo:
@@ -68,6 +72,10 @@ def notify_playback_started():
             elif sound_config.play_beep_apollo:
                 audio_player.play_wav("Apollo_Beep.wav")
 
+            contains_high_end_radio = SoundEffect.HIGH_END_RADIO in sound_config.effects
+            if contains_high_end_radio:
+                audio_player.play_wav("Radio_Static_Beep.wav")
+
             WebSocketUser.ensure_async(
                 audio_player.notify_playback_started(wingman_name)
             )
 
@@ -7,9 +7,14 @@
 import soundfile as sf
 import sounddevice as sd
 from scipy.signal import resample
+from api.enums import SoundEffect
 from api.interface import SoundConfig
 from services.pub_sub import PubSub
-from services.sound_effects import get_sound_effects
+from services.sound_effects import (
+    get_additional_layer_file,
+    get_azure_workaround_gain_boost,
+    get_sound_effects,
+)
 
 
 class AudioPlayer:
@@ -29,6 +34,9 @@ def __init__(
         self.stream_event = PubSub()
         self.on_playback_started = on_playback_started
         self.on_playback_finished = on_playback_finished
+        self.sample_dir = path.join(
+            path.abspath(path.dirname(__file__)), "../audio_samples"
+        )
 
     def set_event_loop(self, loop: asyncio.AbstractEventLoop):
         self.event_loop = loop
@@ -37,14 +45,51 @@ def start_playback(self, audio, sample_rate, channels, finished_callback):
         def callback(outdata, frames, time, status):
             nonlocal playhead
             chunksize = frames * channels
-            current_chunk = audio[playhead : playhead + chunksize].reshape(-1, channels)
-            if current_chunk.shape[0] < frames:
-                outdata[: current_chunk.shape[0]] = current_chunk
-                outdata[current_chunk.shape[0] :] = 0  # Fill the rest with zeros
-                raise sd.CallbackStop  # Stop the stream after playing the current chunk
+            # Output callback: copies the next `chunksize` samples of `audio` into
+            # `outdata`, zero-pads a short final chunk, and raises
+            # `sd.CallbackStop` once the end of `audio` has been reached.
+            # NOTE(review): `playhead` advances in samples (frames * channels) but
+            # is compared with `len(audio)` through `playhead * channels` and
+            # `len(audio) // channels`; these agree only for channels == 1.
+            # Confirm the intended layout of `audio` for multi-channel playback.
+
+            if playhead * channels >= len(audio):
+                # Nothing left to play: emit silence and stop the stream.
+                if np.issubdtype(outdata.dtype, np.floating):
+                    outdata.fill(0.0)  # Fill with zero for floats
+                else:
+                    outdata[:] = bytes(
+                        len(outdata)
+                    )  # Fill with zeros for buffer of int types
+                raise sd.CallbackStop
+
+            end = min(playhead + chunksize, len(audio) // channels)
+            current_chunk = audio[playhead:end]
+
+            if channels > 1 and current_chunk.ndim == 1:
+                current_chunk = np.tile(current_chunk[:, None], (1, channels)).flatten()
+
+            # It's critical that current_chunk matches the number of elements in outdata
+            required_length = frames * channels
+            current_chunk = current_chunk[:required_length]
+
+            if len(current_chunk) < required_length:
+                # Short final chunk: pad with zeros so the whole buffer is defined.
+                current_chunk = np.pad(
+                    current_chunk, (0, required_length - len(current_chunk)), "constant"
+                )
+
+            if outdata.dtype == np.float32 or outdata.dtype == np.float64:
+                outdata[:required_length] = current_chunk.astype(outdata.dtype).reshape(
+                    outdata.shape
+                )
             else:
-                outdata[:] = current_chunk
-                playhead += chunksize  # Advance the playhead
+                current_chunk_bytes = current_chunk.astype(outdata.dtype).tobytes()
+                outdata[: len(current_chunk_bytes)] = current_chunk_bytes[
+                    : len(outdata)
+                ]
+
+            playhead += chunksize
+
+            if end >= len(audio):
+                # The final chunk (already zero-padded above) must stay in
+                # `outdata`. Overwriting the buffer with zeros at this point would
+                # silence the tail of the audio; raising CallbackStop alone ends
+                # the stream after this buffer.
+                raise sd.CallbackStop
 
         playhead = 0  # Tracks the position in the audio
 
@@ -74,6 +119,7 @@ async def play_with_effects(
         input_data: bytes | tuple,
         config: SoundConfig,
         wingman_name: str = None,
+        mixed_layer_gain_boost_db: float = -9.0,
     ):
         if isinstance(input_data, bytes):
             audio, sample_rate = self._get_audio_from_stream(input_data)
@@ -90,6 +136,20 @@ async def play_with_effects(
         for sound_effect in sound_effects:
             audio = sound_effect(audio, sample_rate)
 
+        mixed_layer_file = None
+        for effect in config.effects:
+            if not mixed_layer_file:
+                mixed_layer_file = get_additional_layer_file(effect)
+
+        if mixed_layer_file:
+            audio = self._mix_in_layer(
+                audio, sample_rate, mixed_layer_file, mixed_layer_gain_boost_db
+            )
+
+        contains_high_end_radio = SoundEffect.HIGH_END_RADIO in config.effects
+        if contains_high_end_radio:
+            audio = self._add_wav_effect(audio, sample_rate, "Radio_Static_Beep.wav")
+
         if config.play_beep:
             audio = self._add_wav_effect(audio, sample_rate, "beep.wav")
         elif config.play_beep_apollo:
@@ -130,9 +190,8 @@ async def notify_playback_finished(self, wingman_name: str):
             await self.on_playback_finished(wingman_name)
 
     def play_wav(self, audio_sample_file: str):
-        bundle_dir = path.abspath(path.dirname(__file__))
         beep_audio, beep_sample_rate = self.get_audio_from_file(
-            path.join(bundle_dir, f"../audio_samples/{audio_sample_file}")
+            path.join(self.sample_dir, audio_sample_file)
         )
         self.start_playback(beep_audio, beep_sample_rate, 1, None)
 
@@ -147,15 +206,21 @@ def _get_audio_from_stream(self, stream: bytes) -> tuple:
     def _add_wav_effect(
         self, audio: np.ndarray, sample_rate: int, audio_sample_file: str
     ) -> np.ndarray:
-        bundle_dir = path.abspath(path.dirname(__file__))
         beep_audio, beep_sample_rate = self.get_audio_from_file(
-            path.join(bundle_dir, f"../audio_samples/{audio_sample_file}")
+            path.join(self.sample_dir, audio_sample_file)
         )
 
         # Resample the beep sound if necessary to match the sample rate of 'audio'
         if beep_sample_rate != sample_rate:
             beep_audio = self._resample_audio(beep_audio, beep_sample_rate, sample_rate)
 
+        # Ensure beep_audio has the same number of channels as 'audio'
+        if beep_audio.ndim == 1 and audio.ndim == 2:
+            beep_audio = np.tile(beep_audio[:, np.newaxis], (1, audio.shape[1]))
+
+        if beep_audio.ndim == 2 and audio.ndim == 1:
+            audio = audio[:, np.newaxis]
+
         # Concatenate the beep sound to the start and end of the audio
         audio_with_beeps = np.concatenate((beep_audio, audio, beep_audio), axis=0)
 
@@ -174,11 +239,52 @@ def _resample_audio(
 
         return resampled_audio
 
+    def _mix_in_layer(
+        self,
+        audio: np.ndarray,
+        sample_rate: int,
+        mix_layer_file: str,
+        mix_layer_gain_boost_db: float = 0.0,
+    ) -> np.ndarray:
+        """Overlay a looped layer from ``self.sample_dir`` onto ``audio``.
+
+        The layer file is loaded, resampled when its sample rate differs from
+        ``sample_rate``, adapted to the channel count of ``audio``, repeated or
+        cut to the length of ``audio``, scaled and added sample by sample.
+
+        Args:
+            audio: Samples to mix into; 1-D input is treated as one channel.
+            sample_rate: Sample rate of ``audio``.
+            mix_layer_file: File name of the layer inside ``self.sample_dir``.
+            mix_layer_gain_boost_db: Gain applied to the layer, in dB
+                (converted with ``10 ** (dB / 20)``).
+
+        Returns:
+            A 2-D array with one row per frame of ``audio`` and one column per
+            channel of ``audio``.
+        """
+        noise_audio, noise_sample_rate = self.get_audio_from_file(
+            path.join(self.sample_dir, mix_layer_file)
+        )
+
+        if noise_sample_rate != sample_rate:
+            noise_audio = self._resample_audio(
+                noise_audio, noise_sample_rate, sample_rate
+            )
+
+        # Work on (frames, channels) arrays so the addition lines up per channel.
+        if noise_audio.ndim == 1:
+            noise_audio = noise_audio[:, None]
+
+        if audio.ndim == 1:
+            audio = audio[:, None]
+
+        # An empty layer cannot be looped; dividing by its length would raise.
+        if len(noise_audio) == 0:
+            return audio
+
+        target_channels = audio.shape[1]
+        if noise_audio.shape[1] != target_channels:
+            if noise_audio.shape[1] > 1:
+                # Tiling a multi-channel layer would multiply its channel count
+                # instead of matching the audio, so fold it down to mono first.
+                noise_audio = noise_audio.mean(axis=1, keepdims=True)
+            noise_audio = np.tile(noise_audio, (1, target_channels))
+
+        # Loop the layer until it covers the audio, then cut it to exact length.
+        if len(noise_audio) < len(audio):
+            repeat_count = -(-len(audio) // len(noise_audio))  # ceiling division
+            noise_audio = np.tile(noise_audio, (repeat_count, 1))
+
+        noise_audio = noise_audio[: len(audio)]
+
+        # Convert gain boost from dB to amplitude factor
+        amplitude_factor = 10 ** (mix_layer_gain_boost_db / 20)
+
+        # Apply volume scaling to the mixed-in layer
+        return audio + amplitude_factor * noise_audio
+
+
     async def stream_with_effects(
         self,
         buffer_callback,
         config: SoundConfig,
         wingman_name: str,
+        mix_layer_gain_boost_db: float = 0.0,
         buffer_size=2048,
         sample_rate=16000,
         channels=1,
@@ -188,14 +294,79 @@ async def stream_with_effects(
         buffer = bytearray()
         stream_finished = False
         data_received = False
+        mixed_pos = 0
+
+        mix_layer_file = None
+        for effect in config.effects:
+            if not mix_layer_file:
+                mix_layer_file = get_additional_layer_file(effect)
+                # if we boost the actual audio, we need to boost the mixed layer as well
+                if use_gain_boost:
+                    mix_layer_gain_boost_db += get_azure_workaround_gain_boost(effect)
+
+        if mix_layer_file:
+            noise_audio, noise_sample_rate = self.get_audio_from_file(
+                path.join(self.sample_dir, mix_layer_file)
+            )
+            if noise_sample_rate != sample_rate:
+                noise_audio = self._resample_audio(
+                    noise_audio, noise_sample_rate, sample_rate
+                )
+            if channels > 1 and noise_audio.ndim == 1:
+                noise_audio = np.tile(noise_audio[:, None], (1, channels))
+            noise_audio = noise_audio.flatten()
+
+        def get_mixed_chunk(length):
+            # Return the next `length` samples of the flattened mix layer as
+            # float32, continuing from `mixed_pos` and wrapping around to the
+            # start of the layer whenever its end is reached.
+            # NOTE(review): `mixed_pos` is shared by every caller of this helper
+            # without any locking; confirm callers cannot run concurrently.
+            nonlocal mixed_pos, noise_audio
+            layer_len = len(noise_audio)
+            if layer_len == 0:
+                # An empty layer cannot be looped; return silence instead of
+                # spinning forever without consuming any samples.
+                return np.zeros(length, dtype=np.float32)
+
+            # Modular indexing walks the layer cyclically from the current position.
+            indices = (mixed_pos + np.arange(length)) % layer_len
+            mixed_pos = (mixed_pos + length) % layer_len
+            return noise_audio[indices].astype(np.float32)
 
         def callback(outdata, frames, time, status):
-            nonlocal buffer, stream_finished, data_received
-
+            nonlocal buffer, stream_finished, data_received, mixed_pos
+            # Raw output callback: drains up to `frames * channels` samples from
+            # `buffer` into `outdata`. Sets `stream_finished` once the producer
+            # has signalled `data_received` and the buffer is empty.
             if data_received and len(buffer) == 0:
                 stream_finished = True
-            outdata[: len(buffer)] = buffer[: len(outdata)]
-            buffer = buffer[len(outdata) :]
+                outdata[:] = bytes(len(outdata))  # Fill the buffer with zeros
+                return
+
+            if len(buffer) == 0:
+                # Underrun while the producer is still running: the output
+                # buffer must not be left unwritten, so emit silence.
+                outdata[:] = bytes(len(outdata))
+                return
+
+            num_elements = frames * channels
+            byte_size = np.dtype(dtype).itemsize
+            data_chunk = np.frombuffer(
+                buffer[: num_elements * byte_size], dtype=dtype
+            ).astype(np.float32)
+
+            if len(data_chunk) < num_elements:
+                # Partial chunk: pad with zeros up to a full output buffer.
+                data_chunk = np.pad(
+                    data_chunk, (0, num_elements - len(data_chunk)), "constant"
+                )
+
+            # NOTE(review): `data_chunk` already holds frames * channels samples
+            # here, so for channels > 1 this tiling repeats every sample before
+            # the result is cut back to size. Confirm the layout of `buffer`.
+            if channels > 1 and data_chunk.ndim == 1:
+                data_chunk = np.tile(data_chunk[:, None], (1, channels)).flatten()
+
+            data_chunk = data_chunk[: frames * channels]
+
+            if mix_layer_file:
+                # NOTE(review): the producer loop of the enclosing function also
+                # adds the mix layer before extending `buffer`, so the layer is
+                # applied a second time here. Confirm this is intended.
+                mix_chunk = get_mixed_chunk(len(data_chunk))
+                # Convert gain boost from dB to amplitude factor
+                amplitude_factor = 10 ** (mix_layer_gain_boost_db / 20)
+                data_chunk = (
+                    data_chunk + mix_chunk[: len(data_chunk)] * amplitude_factor
+                )
+
+            data_chunk = data_chunk.flatten()
+            data_chunk_bytes = data_chunk.astype(dtype).tobytes()
+            outdata[: len(data_chunk_bytes)] = data_chunk_bytes[: len(outdata)]
+            buffer = buffer[num_elements * byte_size :]
 
         with sd.RawOutputStream(
             samplerate=sample_rate,
@@ -215,6 +386,10 @@ def callback(outdata, frames, time, status):
             elif config.play_beep_apollo:
                 self.play_wav("Apollo_Beep.wav")
 
+            contains_high_end_radio = SoundEffect.HIGH_END_RADIO in config.effects
+            if contains_high_end_radio:
+                self.play_wav("Radio_Static_Beep.wav")
+
             self.raw_stream.start()
 
             sound_effects = get_sound_effects(
@@ -232,17 +407,25 @@ def callback(outdata, frames, time, status):
                         data_in_numpy, sample_rate, reset=False
                     )
 
+                if mix_layer_file:
+                    noise_chunk = get_mixed_chunk(len(data_in_numpy))
+                    # Convert gain boost from dB to amplitude factor
+                    amplitude_factor = 10 ** (mix_layer_gain_boost_db / 20)
+                    data_in_numpy = data_in_numpy + noise_chunk * amplitude_factor
+
                 processed_buffer = data_in_numpy.astype(dtype).tobytes()
                 buffer.extend(processed_buffer)
-
                 await self.stream_event.publish("audio", processed_buffer)
-
                 filled_size = buffer_callback(audio_buffer)
 
             data_received = True
             while not stream_finished:
                 sd.sleep(100)
 
+            contains_high_end_radio = SoundEffect.HIGH_END_RADIO in config.effects
+            if contains_high_end_radio:
+                self.play_wav("Radio_Static_Beep.wav")
+
             if config.play_beep:
                 self.play_wav("beep.wav")
             elif config.play_beep_apollo: