Spaces:

arham061
/

urdu_TTS

Sleeping

App Files Files Community

arham061 committed on Jul 16, 2023

Commit

b80857a

•

1 Parent(s): 87c1174

Update app.py

Browse files

Files changed (1) hide show

app.py +58 -7

app.py CHANGED Viewed

@@ -2,6 +2,8 @@ import torch
 from transformers import SpeechT5ForTextToSpeech, SpeechT5Processor
 import soundfile as sf
 import gradio as gr
 # Load the TTS model from the Hugging Face Hub
 checkpoint = "arham061/speecht5_finetuned_voxpopuli_nl"  # Replace with your actual model name
@@ -12,12 +14,61 @@ tokenizer = processor.tokenizer
 # Buckwalter to Unicode mapping
 buck2uni = {
-    u"\u0627": "A",
-    u"\u0675": "A",
-    u"\u0673": "A",
-    u"\u0630": "A",
-    u"\u0622": "AA",
-    # Rest of the mapping...
 }
 def transString(string, reverse=0):
@@ -54,7 +105,7 @@ def text_to_speech(text):
     audio_output = generate_audio(text)
     # Save audio as a .wav file
-    sf.write("output.wav", audio_output, samplerate=16000, format='wav', subtype='PCM_16', endian='LITTLE', channels=1, dtype='int16', write_id3v2=False, type='numpy')
     return "output.wav"

 from transformers import SpeechT5ForTextToSpeech, SpeechT5Processor
 import soundfile as sf
 import gradio as gr
+import scipy.io.wavfile as wav
+import numpy as np
 # Load the TTS model from the Hugging Face Hub
 checkpoint = "arham061/speecht5_finetuned_voxpopuli_nl"  # Replace with your actual model name
 # Buckwalter to Unicode mapping
 buck2uni = {
+            u"\u0627":"A",
+            u"\u0627":"A",
+            u"\u0675":"A",
+            u"\u0673":"A",
+            u"\u0630":"A",
+            u"\u0622":"AA",
+            u"\u0628":"B",
+            u"\u067E":"P",
+            u"\u062A":"T",
+            u"\u0637":"T",
+            u"\u0679":"T",
+            u"\u062C":"J",
+            u"\u0633":"S",
+            u"\u062B":"S",
+            u"\u0635":"S",
+            u"\u0686":"CH",
+            u"\u062D":"H",
+            u"\u0647":"H",
+            u"\u0629":"H",
+            u"\u06DF":"H",
+            u"\u062E":"KH",
+            u"\u062F":"D",
+            u"\u0688":"D",
+            u"\u0630":"Z",
+            u"\u0632":"Z",
+            u"\u0636":"Z",
+            u"\u0638":"Z",
+            u"\u068E":"Z",
+            u"\u0631":"R",
+            u"\u0691":"R",
+            u"\u0634":"SH",
+            u"\u063A":"GH",
+            u"\u0641":"F",
+            u"\u06A9":"K",
+            u"\u0642":"K",
+            u"\u06AF":"G",
+            u"\u0644":"L",
+            u"\u0645":"M",
+            u"\u0646":"N",
+            u"\u06BA":"N",
+            u"\u0648":"O",
+            u"\u0649":"Y",
+            u"\u0626":"Y",
+            u"\u06CC":"Y",
+            u"\u06D2":"E",
+            u"\u06C1":"H",
+            u"\u064A":"E"  ,
+            u"\u06C2":"AH"  ,
+            u"\u06BE":"H"  ,
+            u"\u0639":"A"  ,
+            u"\u0643":"K" ,
+            u"\u0621":"A",
+            u"\u0624":"O",
+            u"\u060C":"" #separator: Arabic comma ("ulta" comma), mapped to an empty string
 }
 def transString(string, reverse=0):
     audio_output = generate_audio(text)
     # Save audio as a .wav file
+    wav.write("output.wav", 16000, audio_output.astype(np.int16))
     return "output.wav"