NeyDev committed on
Commit
06a41c8
·
verified ·
1 Parent(s): 28700b7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +30 -28
app.py CHANGED
@@ -1,28 +1,30 @@
1
- from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
2
- import torch
3
- import librosa
4
- import gradio as gr
5
-
6
- # Cargamos el modelo de guaraní
7
- model_name = "ivangtorre/wav2vec2-xlsr-300m-guarani"
8
- processor = Wav2Vec2Processor.from_pretrained(model_name)
9
- model = Wav2Vec2ForCTC.from_pretrained(model_name)
10
-
11
- # Transcripción
12
- def transcribir(audio):
13
- audio_data, _ = librosa.load(audio, sr=16000)
14
- inputs = processor(audio_data, sampling_rate=16000, return_tensors="pt", padding=True)
15
- with torch.no_grad():
16
- logits = model(**inputs).logits
17
- predicted_ids = torch.argmax(logits, dim=-1)
18
- transcription = processor.batch_decode(predicted_ids)[0]
19
- return transcription.lower()
20
-
21
- # Interfaz de Gradio
22
- demo = gr.Interface(
23
- fn=transcribir,
24
- inputs=gr.Audio(type="filepath"),
25
- outputs="text",
26
- title="Transcriptor Guaraní",
27
- description="Subí un audio en guaraní (.ogg, .wav) y obtené la transcripción"
28
- )
 
 
 
1
+ from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
2
+ import torch
3
+ import librosa
4
+ import gradio as gr
5
+
# Checkpoint identifier shared by the acoustic model and its processor
# (Guaraní wav2vec2 fine-tune).
model_name = "ivangtorre/wav2vec2-xlsr-300m-guarani"

# Both objects are created once at import time and reused by every request.
model = Wav2Vec2ForCTC.from_pretrained(model_name)
processor = Wav2Vec2Processor.from_pretrained(model_name)
10
+
# Sampling rate (Hz) the audio is resampled to on load and that is declared
# to the processor; both calls must agree.
SAMPLE_RATE = 16000


def transcribir(audio):
    """Transcribe an audio file and return the text in lower case.

    Args:
        audio: Path to the audio file, as delivered by the
            ``gr.Audio(type="filepath")`` input. ``None`` or an empty
            path is accepted.

    Returns:
        The decoded transcription, lower-cased, or an empty string when
        no audio path was provided.
    """
    # NOTE(review): Gradio is expected to pass None when the form is
    # submitted with nothing uploaded or recorded; return an empty
    # transcription instead of failing inside librosa.load.
    if not audio:
        return ""

    # Load the file resampled to SAMPLE_RATE so it matches what the
    # processor is told below.
    audio_data, _ = librosa.load(audio, sr=SAMPLE_RATE)
    inputs = processor(
        audio_data,
        sampling_rate=SAMPLE_RATE,
        return_tensors="pt",
        padding=True,
    )

    # Inference only: no gradient tracking needed.
    with torch.no_grad():
        logits = model(**inputs).logits

    # Greedy decoding: take the highest-scoring token id at each position.
    predicted_ids = torch.argmax(logits, dim=-1)
    transcription = processor.batch_decode(predicted_ids)[0]
    return transcription.lower()
20
+
# Gradio UI: a single audio input (handed to the callback as a file path)
# and a plain-text output holding the transcription.
demo = gr.Interface(
    title="Transcriptor Guaraní",
    description="Subí un audio en guaraní (.ogg, .wav) y obtené la transcripción",
    fn=transcribir,
    inputs=gr.Audio(type="filepath"),
    outputs="text",
)

# Start the web app.
demo.launch()