Spaces:
Running
Running
Upload app.py
Browse files
app.py
CHANGED
|
@@ -295,6 +295,37 @@ by Kalpi Edition
|
|
| 295 |
download_btn = gr.Button("Save transcript", variant="secondary")
|
| 296 |
download_file = gr.File(label="")
|
| 297 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 298 |
def run(file, model_raw, language, timestamps, translate):
    """Resolve the model name from its raw label and delegate to ``transcribe``.

    Only the first whitespace-separated token of ``model_raw`` is used as the
    model name; every other argument is forwarded to ``transcribe`` unchanged.
    """
    # split() with no separator already discards surrounding whitespace,
    # so the first token needs no further trimming.
    first_token = model_raw.split()[0]
    return transcribe(file, first_token, language, timestamps, translate)
|
|
|
|
| 295 |
download_btn = gr.Button("Save transcript", variant="secondary")
|
| 296 |
download_file = gr.File(label="")
|
| 297 |
|
| 298 |
+
def transcribe(file, model_name, language, show_timestamps, translate):
    """Transcribe an uploaded file and return the transcript twice.

    Args:
        file: The upload to transcribe. Either an object exposing its path as
            ``.name`` or a plain path string; ``None`` means nothing was
            uploaded.
        model_name: Identifier handed to ``load_model``.
        language: ``"Auto Detect"`` passes ``language=None`` to the model;
            ``"Hinglish (Roman)"`` transcribes as Hindi (``"hi"``) and then
            runs the text through ``devanagari_to_roman``; any other value is
            forwarded to the model unchanged.
        show_timestamps: When truthy, the transcript has one line per segment,
            each prefixed with ``[start → end]``.
        translate: ``"Translate to English"`` selects the ``"translate"``
            task; any other value selects ``"transcribe"``.

    Returns:
        A ``(transcript, transcript)`` tuple, or a warning message and an
        empty string when ``file`` is ``None``.
    """
    if file is None:
        return "⚠️ Please upload a file first.", ""

    # Accept both upload objects (path stored in ``.name``) and bare path
    # strings, so the function works regardless of how the upload is passed.
    audio_path = file if isinstance(file, str) else file.name

    model = load_model(model_name)

    romanize = language == "Hinglish (Roman)"
    if romanize:
        # Hinglish: transcribe as Hindi first, romanize the output afterwards.
        lang = "hi"
    elif language == "Auto Detect":
        lang = None
    else:
        lang = language
    task = "translate" if translate == "Translate to English" else "transcribe"

    result = model.transcribe(audio_path, language=lang, task=task)

    if romanize:
        for seg in result["segments"]:
            seg["text"] = devanagari_to_roman(seg["text"])
        result["text"] = devanagari_to_roman(result["text"])

    if show_timestamps:
        transcript = "\n".join(
            f"[{format_time(seg['start'])} → {format_time(seg['end'])}] "
            f"{seg['text'].strip()}"
            for seg in result["segments"]
        )
    else:
        transcript = result["text"].strip()

    return transcript, transcript
|
| 328 |
+
|
| 329 |
def run(file, model_raw, language, timestamps, translate):
    """Resolve the model name from its raw label and delegate to ``transcribe``.

    Only the first whitespace-separated token of ``model_raw`` is used as the
    model name; every other argument is forwarded to ``transcribe`` unchanged.
    """
    # split() with no separator already discards surrounding whitespace,
    # so the first token needs no further trimming.
    first_token = model_raw.split()[0]
    return transcribe(file, first_token, language, timestamps, translate)
|