Commit 853fba0

Enforce 25 KB limit for infinite transcription
The current implementation breaks when a new stream is created, even under the 5-minute limit. This is due to missing logic to handle the 25 KB stream-size limit [1]. Updated the 'generator' function to yield data as soon as the API limit is reached.

[1] - GoogleCloudPlatform#12053
1 parent 974b758 commit 853fba0
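
For a rough sense of scale (not part of the commit; assuming the sample's usual 16 kHz, 16-bit LINEAR16 microphone input): each 100 ms chunk is CHUNK_SIZE = 1600 frames, roughly 3,200 bytes, so the 25 * 1024 = 25,600-byte limit is reached after about 8 buffered chunks (~800 ms of audio). Whenever the local queue backs up past that, a single `yield b"".join(data)` could exceed the per-request limit, which is what the change below splits up.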

1 file changed: +19 -1 lines changed


Diff for: speech/microphone/transcribe_streaming_infinite_v2.py

@@ -40,6 +40,8 @@
 STREAMING_LIMIT = 240000  # 4 minutes
 SAMPLE_RATE = 16000
 CHUNK_SIZE = int(SAMPLE_RATE / 10)  # 100ms
+# 25 KB API limit. Increasing this will throw an error
+MAX_STREAMING_CHUNK = 25 * 1024

 RED = "\033[0;31m"
 GREEN = "\033[0;32m"
@@ -213,7 +215,23 @@ def generator(self: object) -> object:
             except queue.Empty:
                 break

-            yield b"".join(data)
+            # Enforce the max streaming chunk size supported by the API
+            combined_size = sum(len(chunk) for chunk in data)
+            if combined_size <= MAX_STREAMING_CHUNK:
+                yield b"".join(data)
+            else:
+                run_chunks = []
+                run_size = 0
+                for chunk in data:
+                    if len(chunk) + run_size > MAX_STREAMING_CHUNK:
+                        yield b"".join(run_chunks)
+                        run_chunks = [chunk]
+                        run_size = len(chunk)
+                    else:
+                        run_chunks.append(chunk)
+                        run_size += len(chunk)
+                if run_chunks:
+                    yield b"".join(run_chunks)


 def listen_print_loop(responses: object, stream: object) -> None:
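
The regrouping loop can be exercised on its own with synthetic byte strings. The sketch below mirrors the logic added in the diff, but it is a hypothetical standalone helper (split_chunks is not part of the sample), shown only to illustrate how buffered chunks are regrouped under the 25 KB cap.

    # Standalone sketch of the regrouping logic above; `split_chunks` is a
    # hypothetical helper for illustration, not part of the sample.
    MAX_STREAMING_CHUNK = 25 * 1024  # 25 KB per streaming request


    def split_chunks(data: list[bytes], limit: int = MAX_STREAMING_CHUNK):
        """Yield joined byte strings, each holding as many whole chunks as fit under `limit`."""
        run_chunks: list[bytes] = []
        run_size = 0
        for chunk in data:
            if run_chunks and run_size + len(chunk) > limit:
                yield b"".join(run_chunks)
                run_chunks, run_size = [], 0
            run_chunks.append(chunk)
            run_size += len(chunk)
        if run_chunks:
            yield b"".join(run_chunks)


    if __name__ == "__main__":
        # Twelve 3,200-byte chunks (~1.2 s of 16 kHz, 16-bit audio) regroup into
        # one 25,600-byte request (8 chunks) followed by a 12,800-byte request (4 chunks).
        chunks = [b"\x00" * 3200 for _ in range(12)]
        print([len(part) for part in split_chunks(chunks)])  # [25600, 12800]

Grouping whole chunks, rather than slicing bytes mid-chunk, keeps each yielded request on the sample's 100 ms chunk boundaries, matching what the diff does.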
