WhisperSpeech-PDF-text-to-speech

Runtime error

WhisperSpeech-PDF-text-to-speech / app.py

Update app.py

1197cf0 verified 4 months ago

2.08 kB

	import streamlit as st
	from gtts import gTTS
	from io import BytesIO
	import torch
	import torchaudio
	from PyPDF2 import PdfReader
	from whisperspeech.pipeline import Pipeline

	pipe = Pipeline(torch_compile=True)

	st.image('OIG3 (4).jpeg', caption='Your host on this PDF-to-Speech adventure!')

	x = st.slider('Select the number of pages you wish to transcribe')

	uploaded_file = st.file_uploader("Choose a file", "pdf")
	if uploaded_file is not None:
	# creating a pdf reader object
	reader = PdfReader(uploaded_file)
	# printing number of pages in pdf file
	X = len(reader.pages)
	print(X)

	i = 0
	while i <= X and i <= x:
	# getting a specific page from the pdf file
	page = reader.pages[i]
	# extracting text from page
	text = page.extract_text()
	print("Created text of page", i )

	# Generate audio for the current page using a unique filename
	page_audio_file = f"output_{i}.wav"
	pipe.generate_to_file(page_audio_file, text)

	# Display the generated audio using st.audio
	with open(page_audio_file, "rb") as audio_file:
	st.audio(audio_file)

	# sound_file = BytesIO()
	# tts = gTTS(text, lang='en')
	# tts.write_to_fp(sound_file)
	# st.audio(sound_file)
	print("Read aloud", i, "pages of", X, "total pages.")
	i = i + 1
	st.write("🎉 That's the whole PDF! Have an awesome day! 🎉")


	prompt = st.chat_input("Copy/Paste or type in text to have read aloud")
	if prompt:
	st.write(prompt)
	with st.popover("✨ Open your text-to-speech from text input ✨"):
	#sound_file = BytesIO()
	#tts = gTTS(prompt, lang='en')
	#tts.write_to_fp(sound_file)

	#st.audio(sound_file)
	# Generate audio for the current page using a unique filename
	page_audio_file = f"output_{i}.wav"
	pipe.generate_to_file(page_audio_file, text)

	# Display the generated audio using st.audio
	with open(page_audio_file, "rb") as audio_file:
	st.audio(audio_file)