|
import os
import tempfile

import replicate
import streamlit as st
from pydub import AudioSegment
|
|
|
|
|
# Fail fast at startup when the Replicate API token is not configured
# (missing or empty environment variable).
replicate_token = os.environ.get("REPLICATE_API_TOKEN")
if replicate_token is None or replicate_token == "":
    raise ValueError("No se ha encontrado el token de API de Replicate.")
|
|
|
|
|
def dividir_audio(audio_path, segment_duration_ms):
    """Split an audio file into consecutive WAV segments written to disk.

    The audio is loaded with ``AudioSegment.from_file`` and sliced into
    chunks of at most ``segment_duration_ms`` milliseconds; the last chunk
    may be shorter. Each chunk is exported as ``segment_<index>.wav`` using
    a relative path, so files land in the current working directory.

    Args:
        audio_path: Source audio, as accepted by ``AudioSegment.from_file``.
        segment_duration_ms: Maximum segment length in milliseconds. Must be
            a positive integer.

    Returns:
        list[str]: Paths of the exported segment files, in playback order.
        The caller is responsible for deleting them.

    Raises:
        ValueError: If ``segment_duration_ms`` is not positive.
    """
    if segment_duration_ms <= 0:
        raise ValueError(
            "segment_duration_ms must be a positive number of milliseconds."
        )

    audio = AudioSegment.from_file(audio_path)
    audio_length = len(audio)  # pydub reports length in milliseconds
    segments = []

    # Number files by sequential index rather than by start minute: the
    # minute-based name collided (and overwrote earlier segments) whenever
    # segment_duration_ms was shorter than one minute.
    starts = range(0, audio_length, segment_duration_ms)
    for index, start_ms in enumerate(starts):
        segment = audio[start_ms:start_ms + segment_duration_ms]
        segment_path = f"segment_{index}.wav"
        segment.export(segment_path, format="wav")
        segments.append(segment_path)

    return segments
|
|
|
|
|
def transcribe_audio(audio_file):
    """Transcribe an audio file with the Whisper model hosted on Replicate.

    Audio longer than 10 minutes is first split into 10-minute WAV segments
    with ``dividir_audio``; each segment (or the original file, when it is
    short enough) is sent to the model in turn and the resulting texts are
    joined with newlines.

    Args:
        audio_file: Path of the audio file to transcribe.

    Returns:
        str: The transcription, one line per processed segment.
    """
    max_segment_minutes = 10

    duration_minutes = len(AudioSegment.from_file(audio_file)) / (1000 * 60)

    if duration_minutes > max_segment_minutes:
        segments = dividir_audio(
            audio_file,
            segment_duration_ms=max_segment_minutes * 60 * 1000,
        )
        # Only files created here are ours to delete; never the caller's input.
        temporary_segments = list(segments)
    else:
        segments = [audio_file]
        temporary_segments = []

    all_transcriptions = []
    try:
        for segment_path in segments:
            with open(segment_path, "rb") as segment_file:
                output = replicate.run(
                    "vaibhavs10/incredibly-fast-whisper:3ab86df6c8f54c11309d4d1f930ac292bad43ace52d10c80d87eb258b3c9f79c",
                    input={
                        "task": "transcribe",
                        "audio": segment_file,
                        # NOTE(review): the literal string "None" is presumably
                        # the model's "auto-detect" option; confirm against
                        # the model's input schema.
                        "language": "None",
                        "timestamp": "chunk",
                        "batch_size": 64,
                        "diarise_audio": False,
                    },
                )
            all_transcriptions.append(output['text'])
    finally:
        # Remove the intermediate segment files even if a request failed, so
        # repeated runs do not accumulate WAV files on disk.
        for path in temporary_segments:
            try:
                os.remove(path)
            except OSError:
                # Best-effort cleanup: a leftover file must not mask the
                # transcription result or the original error.
                pass

    return "\n".join(all_transcriptions)
|
|
|
|
|
|
|
# --- Streamlit UI: upload an audio file and display its transcription ---
st.title("Transcripción de Audio usando Whisper")

uploaded_audio = st.file_uploader(
    "Sube tu archivo de audio",
    type=["wav", "mp3", "ogg", "flac"],
)

if uploaded_audio is not None:
    # Keep the upload's real extension and use a unique temporary file, so
    # concurrent sessions do not overwrite each other's audio and non-WAV
    # uploads are not mislabeled as ".wav".
    suffix = os.path.splitext(uploaded_audio.name)[1] or ".wav"
    with tempfile.NamedTemporaryFile(suffix=suffix, delete=False) as tmp:
        # getvalue() returns the whole upload regardless of the current
        # stream position.
        tmp.write(uploaded_audio.getvalue())
        temp_audio_path = tmp.name

    try:
        st.info("Transcribiendo el audio, esto puede tardar unos minutos...")
        transcription = transcribe_audio(temp_audio_path)
    finally:
        # The temporary copy is only needed while transcribing.
        os.remove(temp_audio_path)

    st.subheader("Transcripción")
    st.text(transcription)
|
|