Spaces:

PlotweaverModel
/

Live-Football-Commentary

Running

PlotweaverModel committed on 15 days ago

Commit

79f78ef

verified ·

1 Parent(s): db26bd8

Updating app file

Files changed (1) hide show

app.py CHANGED Viewed

@@ -108,13 +108,30 @@ def split_into_sentences(text):
 def transcribe(audio_array, sample_rate=16000):
-    """ASR: English audio to text."""
     if len(audio_array) < 1600:  # Less than 0.1s
         return ""
-    result = asr_pipe(
-        {"raw": audio_array, "sampling_rate": sample_rate},
-        return_timestamps=False,
-    )
     return result["text"].strip()

 def transcribe(audio_array, sample_rate=16000):
+    """ASR: English audio to text.
+    Audio longer than 28 s is transcribed with chunking and timestamps
+    enabled; shorter audio is transcribed in a single pass.
+    """
     if len(audio_array) < 1600:  # Less than 0.1s
         return ""
+    duration_s = len(audio_array) / sample_rate
+    if duration_s > 28:
+        # Long-form: enable chunking and timestamps (required by Whisper)
+        result = asr_pipe(
+            {"raw": audio_array, "sampling_rate": sample_rate},
+            return_timestamps=True,
+            chunk_length_s=25,
+            stride_length_s=5,
+        )
+    else:
+        # Short: standard single-pass transcription
+        result = asr_pipe(
+            {"raw": audio_array, "sampling_rate": sample_rate},
+            return_timestamps=False,
+        )
     return result["text"].strip()