WhisperSpeech-PDF-text-to-speech

Runtime error

App Files Files Community

WhisperSpeech-PDF-text-to-speech / app.py

Solshine

Update app.py

690df34 verified 4 months ago

raw history blame contribute delete

No virus

2.14 kB

	import streamlit as st
	from gtts import gTTS
	from io import BytesIO
	import torch
	import torchaudio
	from PyPDF2 import PdfReader
	from whisperspeech.pipeline import Pipeline

	# Banner image shown at the top of the app.
	st.image('OIG3 (4).jpeg', caption='Your host on this PDF-to-Speech adventure!')


	@st.cache_resource
	def _load_pipeline():
	    """Build the WhisperSpeech text-to-speech pipeline once per server process.

	    Streamlit re-executes this script from top to bottom on every widget
	    interaction; caching the pipeline as a shared resource avoids
	    constructing (and re-compiling) the model on each rerun.
	    """
	    return Pipeline(torch_compile=True)


	st.write("⏳ Loading WhisperSpeech Pipeline ⌛")
	# TTS pipeline
	pipe = _load_pipeline()

	# Number of pages to read aloud. The slider starts at 1 so that its value is
	# a real page count and the default selection still reads the first page.
	x = st.slider(
	    'Select the number of pages you wish to transcribe',
	    min_value=1,
	    max_value=100,
	    value=1,
	)

	uploaded_file = st.file_uploader("Choose a file", "pdf")
	if uploaded_file is not None:
	    # Parse the uploaded PDF and log how many pages it contains.
	    reader = PdfReader(uploaded_file)
	    X = len(reader.pages)
	    print(X)

	    # Never index past the last page, whatever the slider is set to.
	    pages_to_read = min(x, X)
	    for i in range(pages_to_read):
	        # extract_text() may yield nothing for image-only pages.
	        text = reader.pages[i].extract_text() or ""
	        print("Created text of page", i)

	        if not text.strip():
	            # Nothing to synthesise for this page; move on to the next one.
	            st.write(f"Page {i + 1} has no extractable text, skipping it.")
	            continue

	        # Generate audio for the current page using a unique filename
	        page_audio_file = f"output_{i}.wav"
	        pipe.generate_to_file(page_audio_file, text)

	        # Display the generated audio using st.audio
	        with open(page_audio_file, "rb") as audio_file:
	            st.audio(audio_file)

	        # i is zero-based, so i + 1 pages have been read at this point.
	        print("Read aloud", i + 1, "pages of", X, "total pages.")
	    st.write("🎉 That's the whole PDF! Have an awesome day! 🎉")


	# Free-text input: read aloud whatever the user types or pastes.
	prompt = st.chat_input("Copy/Paste or type in text to have read aloud")
	if prompt:
	    st.write(prompt)
	    with st.popover("✨ Open your text-to-speech from text input ✨"):
	        # Synthesise the submitted prompt itself. The output filename is
	        # fixed so this section works whether or not a PDF was uploaded.
	        prompt_audio_file = "output_prompt.wav"
	        pipe.generate_to_file(prompt_audio_file, prompt)

	        # Display the generated audio using st.audio
	        with open(prompt_audio_file, "rb") as audio_file:
	            st.audio(audio_file)