Spaces:

Amelia-James
/

voice-cloning-app

Sleeping

App Files Files Community

Amelia-James committed on 15 days ago

Commit

af12bd1

•

1 Parent(s): 1564098

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -23

app.py CHANGED Viewed

@@ -11,7 +11,7 @@ client = Groq(api_key=os.getenv("GROQ_API_KEY"))
 # Streamlit UI
 st.title("Voice Cloning Application")
-st.markdown("Clone your voice using Groq's Whisper Model and generate natural responses.")
 # Upload audio file
 uploaded_file = st.file_uploader(
@@ -24,34 +24,21 @@ if uploaded_file is not None:
     st.audio(uploaded_file, format=f"audio/{uploaded_file.type.split('.')[-1]}")
     st.write("Transcription in progress...")
-    # Transcription Logic
     try:
-        transcription = client.chat.completions.create(
-            messages=[
-                {
-                    "role": "user",
-                    "content": f"Transcribe the following audio file: {uploaded_file.name}"
-                }
-            ],
             model="whisper-large-v3-turbo",
         )
         # Display the transcription
-        transcribed_text = transcription.choices[0].message.content
         st.success("Transcription completed!")
-        st.write("**Transcribed Text:**", transcribed_text)
-        # Placeholder for voice cloning (TTS integration can go here)
-        st.markdown("---")
-        st.subheader("Generate Speech from Transcription")
-        tts_input = st.text_area("Enter text to generate speech:", value=transcribed_text)
-        if st.button("Generate Speech"):
-            if tts_input:
-                # Simulate TTS functionality (placeholder for TTS model integration)
-                st.success("Generated speech successfully! (Placeholder)")
-            else:
-                st.warning("Please enter some text.")
     except Exception as e:
         st.error(f"Error during transcription: {e}")

 # Streamlit UI
 st.title("Voice Cloning Application")
+st.markdown("Clone your voice using Groq's Whisper Model for transcription.")
 # Upload audio file
 uploaded_file = st.file_uploader(
     st.audio(uploaded_file, format=f"audio/{uploaded_file.type.split('.')[-1]}")
     st.write("Transcription in progress...")
+    # Read file contents as binary
+    audio_bytes = uploaded_file.read()
     try:
+        # Transcription request to the Whisper model
+        transcription = client.audio.transcriptions.create(
+            file=audio_bytes,
             model="whisper-large-v3-turbo",
+            response_format="text",  # Options: "text", "json"
         )
         # Display the transcription
         st.success("Transcription completed!")
+        st.write("**Transcribed Text:**")
+        st.text_area("Transcription", transcription, height=200)
     except Exception as e:
         st.error(f"Error during transcription: {e}")