Spaces:

nbiish
/

boozhoo_bot_prelangchain

Sleeping

App Files Files Community

K3NW48 committed on Mar 23, 2023

Commit

62b117d

•

1 Parent(s): dc2f095

release

Browse files

Files changed (5) hide show

README.md +3 -3
app.py +133 -0
input_audio.wav +0 -0
requirements.txt +143 -0
response.mp3 +0 -0

README.md CHANGED Viewed

@@ -1,8 +1,8 @@
 ---
 title: BoozhooBot
-emoji: 🦀
-colorFrom: green
-colorTo: red
 sdk: gradio
 sdk_version: 3.23.0
 app_file: app.py

 ---
 title: BoozhooBot
+emoji: 😻
+colorFrom: indigo
+colorTo: indigo
 sdk: gradio
 sdk_version: 3.23.0
 app_file: app.py

app.py ADDED Viewed

	@@ -0,0 +1,133 @@

+# Import the required libraries
+import gradio as gr
+import openai
+from gtts import gTTS
+from pydub import AudioSegment
+import os
+# Conversation history sent to the chat model; seeded with the system prompt
+# that sets the persona.  transcribe() appends each user and reply message.
+messages = [{"role": "system", "content": 'You are the Anishinaabe hero Nanaboozhoo. Not only do you answer with profound wisdom but you will continue the conversation by answering like this, Boozhoo: (your answer)'}]
+# Text of every transcribed user recording, in order.
+full_transcript = []
+# Starts empty; set_api() stores the user's key here.
+openai.api_key = ""
+# File name of the spoken reply (speak() writes to this same literal path).
+audio_file = 'response.mp3'
+def set_api(my_key):
+    """Store the caller's OpenAI API key on the ``openai`` module.
+
+    Args:
+        my_key: API key text as typed or pasted by the user.  Surrounding
+            whitespace (for example a trailing newline from copy/paste) is
+            removed because it would otherwise be sent as part of the
+            credential.  Non-string values such as ``None`` are stored
+            unchanged.
+    """
+    openai.api_key = my_key.strip() if isinstance(my_key, str) else my_key
+def create_image(response):
+    """Turn a chat completion into an illustration and return its URL.
+
+    The reply text in ``response`` is first condensed by gpt-3.5-turbo into
+    a Dall-E prompt, and that prompt is then sent to the image endpoint.
+
+    Args:
+        response: Chat completion result; the text is read from
+            ``response["choices"][0]["message"]["content"]``.
+
+    Returns:
+        The ``url`` field of the first generated image.
+    """
+    reply_text = response["choices"][0]["message"]["content"]
+    summary_request = {
+        "role": "user",
+        "content": f'Summarize this text "{reply_text}" into a short and concise Dall-E 2 prompt starting with "A Professional photograph of an Anishinaabe person saying :(summarization)".',
+    }
+    # Step 1: have the chat model write the image prompt.
+    summary = openai.ChatCompletion.create(
+        model="gpt-3.5-turbo",
+        messages=[summary_request],
+    )
+    # Step 2: render that prompt as a 512x512 picture.
+    picture = openai.Image.create(
+        prompt=summary["choices"][0]["message"]["content"],
+        size="512x512",
+    )
+    return picture['data'][0]['url']
+def speak(system_message):
+    """Synthesize a chat message as English speech with gTTS.
+
+    Args:
+        system_message: Mapping whose ``'content'`` entry is the text to read.
+
+    Returns:
+        The path of the MP3 that was written, always ``"response.mp3"``.
+    """
+    gTTS(system_message['content'], lang='en', slow=False).save("response.mp3")
+    return "response.mp3"
+def transcribe(gradio_input, api_key):
+    """Run one voice turn: speech -> text -> chat reply -> image and speech.
+
+    Args:
+        gradio_input: Path of the recorded audio file supplied by Gradio.
+        api_key: OpenAI API key used for the requests made in this turn.
+
+    Returns:
+        A tuple ``(speech, chat_transcript, pic_url)``: the path of the
+        spoken reply, the conversation so far as text (system prompt
+        omitted), and the URL of the generated image.
+
+    Raises:
+        gr.Error: If no recording was provided.
+    """
+    if not gradio_input:
+        # Submitting without a recording hands us an empty value; fail with
+        # a readable message instead of an opaque decoder error.
+        raise gr.Error("Please record some audio before submitting.")
+    set_api(api_key)
+    # Convert the recording to WAV before sending it to Whisper.
+    AudioSegment.from_file(gradio_input).export("input_audio.wav", format="wav")
+    # Use a local handle name: binding the module-level ``audio_file`` here
+    # would replace that path string with a closed file object.
+    with open("input_audio.wav", "rb") as wav_file:
+        print(f"Audio file format: {os.path.splitext(wav_file.name)[1]}\n")
+        transcript = openai.Audio.transcribe("whisper-1", wav_file)
+    # Record what the user said (the lists are mutated in place, so no
+    # ``global`` declaration is needed).
+    full_transcript.append(transcript["text"])
+    messages.append({"role": "user", "content": transcript["text"]})
+    # Send the whole conversation to OpenAI to get the next reply.
+    response = openai.ChatCompletion.create(
+        model="gpt-3.5-turbo",
+        messages=messages
+    )
+    # Keep the model's reply in the history so later turns have context.
+    reply_message = response["choices"][0]["message"]
+    messages.append(reply_message)
+    pic_url = create_image(response)
+    speech = speak(reply_message)
+    # Render every non-system message as "role: content" paragraphs.
+    chat_transcript = "".join(
+        message['role'] + ": " + message['content'] + "\n\n"
+        for message in messages
+        if message['role'] != 'system'
+    )
+    return speech, chat_transcript, pic_url
+# Markdown snippets interpolated at the end of the interface description.
+MY_INFO = '\nSupport me at my [Linktree](https://linktr.ee/Nbiish).'
+API_INFO = 'Get your api key at [platform.openai.com/account/api-keys](https://platform.openai.com/account/api-keys)'
+# Create a Gradio interface: microphone audio and an API key go in; the
+# spoken reply, the chat transcript and a generated image come out.
+demo = gr.Interface(
+    fn=transcribe,
+    inputs=[
+        gr.Audio(source="microphone", type="filepath", show_label=False),
+        # The key reaches set_api() through transcribe()'s second argument.
+        # The former ``default=`` and ``fn=`` keywords were removed: they are
+        # not Textbox parameters and only produced unused-kwarg warnings.
+        gr.Textbox(
+            label="OpenAI API Key",
+            lines=1,
+            placeholder="Enter your OpenAI API key",
+            type="password",
+        ),
+    ],
+    outputs=[
+        gr.Audio(show_label=False),
+        gr.Textbox(label="Transcript:"),
+        gr.Image(show_label=False),
+    ],
+    title="Boozhoo Bot",
+    description=f"""
+    Anishinaabe Chatbot
+    Applies OpenAI's Whisper to transcribe audio input.
+    GPT-3.5 Turbo to generate a response.
+    Dall-E 2.0 to generate an image.
+    gTTS to generate audio response.
+    1) Record to get started
+    2) Press X near recording to keep going
+    3) Refresh page to restart
+    {MY_INFO}
+    {API_INFO}
+    """,
+)
+# Start the app with request queuing only when run as a script.
+if __name__ == "__main__":
+    demo.queue().launch()

input_audio.wav ADDED Viewed

Binary file (121 kB). View file

requirements.txt ADDED Viewed

	@@ -0,0 +1,143 @@

+aiofiles==23.1.0
+aiohttp==3.8.4
+aiosignal==1.3.1
+altair==4.2.2
+anyio==3.6.2
+async-timeout==4.0.2
+attrs==21.2.0
+Automat==20.2.0
+Babel==2.8.0
+bcrypt==3.2.0
+black==21.10b0
+blinker==1.4
+certifi==2020.6.20
+cffi==1.15.1
+chardet==4.0.0
+charset-normalizer==3.0.1
+click==8.0.3
+cloud-init==22.4.2
+colorama==0.4.4
+command-not-found==0.3
+config==0.5.1
+configobj==5.0.6
+constantly==15.1.0
+contourpy==1.0.7
+cryptography==3.4.8
+cycler==0.11.0
+dbus-python==1.2.18
+distlib==0.3.4
+distro==1.7.0
+distro-info===1.1build1
+entrypoints==0.4
+fastapi==0.92.0
+ffmpy==0.3.0
+filelock==3.6.0
+Flask==2.2.3
+fonttools==4.38.0
+frozenlist==1.3.3
+fsspec==2023.1.0
+gradio==3.23.0
+gTTS==2.3.1
+h11==0.14.0
+httpcore==0.16.3
+httplib2==0.20.2
+httpx==0.23.3
+huggingface-hub==0.13.3
+hyperlink==21.0.0
+idna==3.3
+importlib-metadata==4.6.4
+incremental==21.3.0
+ipython_genutils==0.2.0
+itsdangerous==2.1.2
+jeepney==0.7.1
+Jinja2==3.0.3
+jsonpatch==1.32
+jsonpointer==2.0
+jsonschema==3.2.0
+jupyter-core==4.9.1
+keyring==23.5.0
+kiwisolver==1.4.4
+launchpadlib==1.10.16
+lazr.restfulclient==0.14.4
+lazr.uri==1.0.6
+linkify-it-py==2.0.0
+markdown-it-py==2.2.0
+MarkupSafe==2.1.2
+matplotlib==3.7.0
+mdit-py-plugins==0.3.3
+mdurl==0.1.2
+more-itertools==8.10.0
+multidict==6.0.4
+mypy-extensions==0.4.3
+netifaces==0.11.0
+numpy==1.24.2
+oauthlib==3.2.0
+openai==0.27.2
+orjson==3.8.7
+packaging==23.0
+pandas==1.5.3
+pathspec==0.9.0
+pexpect==4.8.0
+Pillow==9.4.0
+pipenv==11.9.0
+platformdirs==2.5.1
+ptyprocess==0.7.0
+pyasn1==0.4.8
+pyasn1-modules==0.2.1
+PyAudio==0.2.13
+pycparser==2.21
+pycryptodome==3.17
+pydantic==1.10.5
+pydub==0.25.1
+Pygments==2.11.2
+PyGObject==3.42.1
+PyHamcrest==2.0.2
+PyJWT==2.3.0
+pymacaroons==0.13.0
+PyNaCl==1.5.0
+pyOpenSSL==21.0.0
+pyparsing==2.4.7
+pypng==0.20220715.0
+pyrsistent==0.18.1
+pyserial==3.5
+python-apt==2.4.0+ubuntu1
+python-dateutil==2.8.2
+python-debian===0.1.43ubuntu1
+python-dotenv==0.21.1
+python-magic==0.4.24
+python-multipart==0.0.6
+pyttsx3==2.90
+pytz==2022.1
+PyYAML==5.4.1
+requests==2.28.2
+rfc3986==1.5.0
+SecretStorage==3.3.1
+semantic-version==2.10.0
+service-identity==18.1.0
+six==1.16.0
+sniffio==1.3.0
+sos==4.4
+SpeechRecognition==3.9.0
+ssh-import-id==5.11
+starlette==0.25.0
+systemd-python==234
+tomli==1.2.2
+toolz==0.12.0
+tqdm==4.64.1
+traitlets==5.1.1
+Twisted==22.1.0
+typing_extensions==4.5.0
+ubuntu-advantage-tools==8001
+uc-micro-py==1.0.1
+ufw==0.36.1
+unattended-upgrades==0.1
+urllib3==1.26.5
+uvicorn==0.20.0
+virtualenv==20.13.0+ds
+virtualenv-clone==0.3.0
+wadllib==1.3.6
+websockets==10.4
+Werkzeug==2.2.3
+yarl==1.8.2
+zipp==1.0.0
+zope.interface==5.4.0

response.mp3 ADDED Viewed

Binary file (53 kB). View file