Xhaheen's picture
Update app.py
f291f2f
import whisper
import gradio as gr
import time
import warnings
import torch
import os
import openai
from PIL import Image
import requests
from io import BytesIO
import time
# Timestamp (seconds since the epoch) captured once, when the module is loaded.
time_now = time.time()
# The OpenAI key is read from the "api_key" environment variable; if the
# variable is not set, the lookup below raises KeyError at import time.
# A key can be assigned directly instead, e.g. for local experiments:
# openai.api_key = '' # your api key
openai.api_key = os.environ["api_key"]
# Whisper checkpoint, loaded once at import and used by transcribe().
model = whisper.load_model("base")
# Alternative checkpoint:
# model = whisper.load_model("medium.en")
def transcribe(audio, text, langauge):
    """Turn a spoken or typed topic into a poem and a matching image.

    Args:
        audio: Path to a recorded audio file, or None to fall back to ``text``.
        text: Typed topic; only used when ``audio`` is None.
        langauge: Language the poem should be written in. The parameter keeps
            its original spelling so existing callers are unaffected.

    Returns:
        A list ``[topic, poem, image]``: the topic text (transcribed or typed),
        the text of the first completion choice, and the generated picture
        opened as a PIL image.

    Raises:
        ValueError: If neither the recording nor the text box yields a topic.
        requests.RequestException: If downloading the generated image fails,
            times out, or returns an HTTP error status.
    """
    if audio is None:
        result_text = text
    else:
        # Load the recording and pad/trim it to fit 30 seconds.
        samples = whisper.pad_or_trim(whisper.load_audio(audio))
        # Log-Mel spectrogram, moved to the same device as the model.
        mel = whisper.log_mel_spectrogram(samples).to(model.device)
        # The previous explicit model.detect_language(mel) call was removed:
        # its result was never read. Decoding options are unchanged.
        options = whisper.DecodingOptions(fp16=False)
        result_text = whisper.decode(model, mel, options).text

    # Fail early instead of spending two API calls on an empty prompt.
    if not result_text or not result_text.strip():
        raise ValueError(
            "No topic provided: record audio or type a topic for the poem."
        )

    # Spaces around the interpolated values keep the topic and the language
    # from being glued to the neighbouring words of the prompt.
    completion = openai.Completion.create(
        model="text-davinci-003",
        prompt=f"write a full poem on {result_text} in {langauge} language",
        temperature=0.7,
        max_tokens=1000,
        top_p=1,
        frequency_penalty=0,
        presence_penalty=0,
    )
    out_result = completion.choices[0].text

    generated = openai.Image.create(
        prompt=f"{result_text} animated 4k",
        n=1,
        size="512x512",  # "1024x1024"
    )
    image_url = generated["data"][0]["url"]

    # A timeout keeps a stalled download from blocking the request forever,
    # and the status check surfaces HTTP errors before the payload is parsed
    # as an image.
    download = requests.get(image_url, timeout=30)
    download.raise_for_status()
    out_image = Image.open(BytesIO(download.content))

    return [result_text, out_result, out_image]
# Output components, listed in the order transcribe() returns its values.
output_1 = gr.Textbox(label="Speech to Text")
output_2 = gr.Textbox(label="GPT-3 Davinci Output")
output_3 = gr.Image(label="DallE Output")

# Build the UI and start serving it. The audio input uses the top-level
# gr.Audio component (same arguments as before) rather than the deprecated
# gr.inputs namespace, matching the other components in this file.
gr.Interface(
    fn=transcribe,
    inputs=[
        gr.Audio(
            source="microphone",
            label="use whisper tell app topic of poem , use text input below if you have problem with mic",
            type="filepath",
        ),
        gr.Textbox(label="poem on(Use english word mostly)"),
        gr.Textbox(label="language"),
    ],
    outputs=[output_1, output_2, output_3],
    title="Children of heaven🌸🏡: Create Beautiful multilingual Poems with Relevant Images",
    description="Children of heaven🌸🏡is a web app that uses artificial intelligence to generate beautiful multilingual poems and relevant images. With its powerful language GPT3 model, it can create unique and inspiring multilingual poems on a wide range of childrens' topics, and its Dall E model creates images that perfectly complement the poem. Give children of heaven a try and discover the magic of multilingual poetry and art. Whether you're a professional or kid , this app is sure to spark your creativity and inspire you to create something beautiful.this is research work kindly report any bias in content in community section ",
).launch(debug=True)