Spaces:

BenDaouda
/

ASR_Audio_to_wolof

Runtime error

BenDaouda committed on Apr 20, 2023

Commit

832feba

•

1 Parent(s): 9d1a6b5

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,17 +1,17 @@
-from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
-import torch
-import gradio as gr
-model = Wav2Vec2ForCTC.from_pretrained("BenDaouda/wav2vec2-large-xls-r-300m-wolof-test-coloab")
-processor = Wav2Vec2Processor.from_pretrained("BenDaouda/wav2vec2-large-xls-r-300m-wolof-test-coloab")
 def transcribe(audio):
-    input_values = tokenizer(audio, return_tensors="pt").input_values
-    with torch.no_grad():
-        logits = model(input_values).logits
-    predicted_ids = torch.argmax(logits, dim=-1)
-    transcription = tokenizer.batch_decode(predicted_ids)[0]
-    return transcription
 iface = gr.Interface(
     fn=transcribe,
@@ -19,4 +19,4 @@ iface = gr.Interface(
     outputs="text"
 )
-iface.launch()

+from transformers import pipeline, AutoTokenizer
+# Spécifiez le nom du modèle et le jeton d'authentification
+model_name = "BenDaouda/wav2vec2-large-xls-r-300m-wolof-test-coloab"
+token = "votre-jeton-d'authentification-hugging-face"
+# Chargez le modèle et le tokenizer en utilisant le jeton d'authentification
+tokenizer = AutoTokenizer.from_pretrained(model_name, use_auth_token=True)
+model = pipeline("automatic-speech-recognition", model=model_name, tokenizer=tokenizer, task="asr", use_auth_token=True)
+# Gradio callback that runs the loaded model
 def transcribe(audio):
+    result = model(audio)
+    return result[0]['text']
+# Build the Gradio interface around transcribe() (text output) and launch it.
+# NOTE(review): this diff view elides the line(s) between the two hunks inside
+# the call below (presumably the `inputs=` argument) — confirm against app.py.
 iface = gr.Interface(
     fn=transcribe,
     outputs="text"
 )
+iface.launch()