demo committed · Commit 103a375
Parent(s): ffd8f44
initial version
Browse files
- .env +14 -0
- .gitignore +1 -0
- DEVELOPMENT.md +94 -0
- Dockerfile +24 -0
- LICENSE +21 -0
- README.md +54 -2
- app.py +70 -0
- compose.yaml +5 -0
- fn_diff.py +13 -0
- model_llama.py +86 -0
- model_llamacpp.py +81 -0
- model_wben.py +53 -0
- requirements.txt +7 -0
.env
ADDED
@@ -0,0 +1,14 @@
+GRADIO_SERVER_IP="0.0.0.0"
+GRADIO_SERVER_PORT=7860
+
+TASK_ASR="automatic-speech-recognition"
+MODEL_WHISPER1="openai/whisper-base.en"
+MODEL_WHISPER1_FILE="model.safetensors"
+
+TASK_TXTGEN="text-generation"
+
+MODEL_LLAMA="TheBloke/Llama-2-7b-Chat-GGUF"
+MODEL_LLAMA_FILE="llama-2-7b-chat.Q5_K_M.gguf"
+
+MODEL_MISTRAL="TheBloke/Mistral-7B-Instruct-v0.2-GGUF"
+MODEL_MISTRAL_FILE="mistral-7b-instruct-v0.2.Q5_K_M.gguf"
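These settings are read at runtime with python-dotenv, which app.py and each model module call on import. A minimal sketch of the pattern (variable names taken from the .env above):

```python
import os
from dotenv import load_dotenv

load_dotenv()  # reads .env from the current working directory

# The same lookups the app modules perform; the port must be cast
# to int before being passed to gradio's demo.launch().
server_ip = os.getenv("GRADIO_SERVER_IP")           # "0.0.0.0"
server_port = int(os.getenv("GRADIO_SERVER_PORT"))  # 7860
model_id = os.getenv("MODEL_MISTRAL")               # "TheBloke/Mistral-7B-Instruct-v0.2-GGUF"
```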
.gitignore
ADDED
@@ -0,0 +1 @@
+__pycache__
DEVELOPMENT.md
ADDED
@@ -0,0 +1,94 @@
+# Installation Notes for Development
+
+## Running Eloquent App in Docker
+The easiest way to install and run the Eloquent app is to use the Docker container from HuggingFace. You will need Docker installed on your system (see the prerequisites below); then run the app container:
+
+```
+docker run -it -p 7860:7860 --platform=linux/amd64 \
+  registry.hf.space/vgotcheva-eloquent:latest
+```
+
+When the app container has fully started in Docker, the app can be accessed in the browser at [http://localhost:7860](http://localhost:7860).
+
+Eloquent App is a Gradio app written in Python. It uses ```automatic-speech-recognition``` and ```text-generation``` models through the HuggingFace transformers library.
+
+The app has been tested on a laptop with the following specifications:
+- CPU: 11th Gen Intel(R) Core(TM) i7-1165G7 @ 2.80GHz
+- RAM: 16.0 GB
+- GPU: none
+- SSD: at least 25GB of available space
+
+Note that the AI models (about 6GB total) are downloaded and cached locally during container start-up, so the app may take 10-15 min to start depending on the download speed.
+
+## Running Eloquent App in a Python Environment
+The app can also be run in a Python development environment. Please check the prerequisites below.
+
+Clone the repository and cd into the cloned folder:
+```
+git clone https://huggingface.co/spaces/vgotcheva/eloquent
+cd eloquent
+```
+
+Install the app requirements:
+```
+pip install --no-cache-dir --upgrade -r requirements.txt
+```
+
+Start the app:
+```
+python app.py
+```
+
+Use the app by opening [http://localhost:7860](http://localhost:7860) in the browser.
+
+## Prerequisites for development under Windows 11
+
+### Visual Studio Code
+https://code.visualstudio.com/
+
+### Git for Windows including Git Credential Manager
+https://gitforwindows.org/
+
+### WSL 2 (with Git for Windows)
+https://learn.microsoft.com/en-us/windows/wsl/install
+
+### Linux Distribution in WSL
+```
+Ubuntu 20.04.6 LTS
+```
+
+### git and git-lfs
+```bash
+apt-get install git git-lfs
+```
+
+### Anaconda in Ubuntu
+```bash
+$ conda -V
+conda 23.11.0
+```
+
+### conda virtual environment and pip
+- https://conda.io/projects/conda/en/latest/user-guide/tasks/manage-environments.html#activating-an-environment
+- https://anaconda.org/anaconda/pip
+
+### Set up Git Credential Manager in Ubuntu git
+https://github.com/git-ecosystem/git-credential-manager/blob/release/docs/wsl.md
+
+```
+git config --global credential.helper '/mnt/c/Program Files/Git/mingw64/bin/git-credential-manager.exe'
+```
+or add it directly to ~/.gitconfig:
+```
+$ cat ~/.gitconfig
+[user]
+  name = demo
+  email = demo@local
+[credential]
+  helper = /mnt/c/Program\\ Files/Git/mingw64/bin/git-credential-manager.exe
+```
+
+https://docs.gitlab.com/ee/ci/ci_cd_for_external_repos/
+
+### Docker Desktop WSL 2 backend on Windows
+https://docs.docker.com/desktop/wsl/
Dockerfile
ADDED
@@ -0,0 +1,24 @@
+FROM registry.hf.space/vgotcheva-base-dev:latest
+#FROM python:3.9
+#ARG GRADIO_SERVER_PORT=7000
+#ENV GRADIO_SERVER_PORT=${GRADIO_SERVER_PORT}
+
+RUN apt-get update && apt-get install -y python3 python3-pip
+
+RUN useradd -m -u 1000 user
+USER user
+ENV HOME=/home/user \
+    PATH=/home/user/.local/bin:$PATH
+
+WORKDIR $HOME/app
+COPY --chown=user . $HOME/app
+
+#WORKDIR /code
+#COPY ./requirements.txt /code/requirements.txt
+RUN pip install --no-cache-dir --upgrade pip
+RUN pip install --no-cache-dir --upgrade -r requirements.txt
+
+# Needed for caching the llama model due to its large size
+RUN python -c "import model_llama as ml; ml.cached_folder"
+
+CMD ["python", "app.py"]
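The model-caching step works by side effect: importing model_llama runs its module-level snapshot_download call during the build, so the GGUF file lands in the image's HuggingFace cache layer instead of being fetched at container start. A standalone sketch of the equivalent explicit download (repo and file names taken from the .env above):

```python
from huggingface_hub import snapshot_download

# Fetches only the single model file into the local HF cache and returns
# the snapshot folder - the same call model_llama.py makes at import time.
folder = snapshot_download(
    repo_id="TheBloke/Mistral-7B-Instruct-v0.2-GGUF",
    allow_patterns="mistral-7b-instruct-v0.2.Q5_K_M.gguf",
)
print(folder)
```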
LICENSE
ADDED
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2024 Violeta Gotcheva
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
README.md
CHANGED
@@ -1,11 +1,63 @@
 ---
-title: Eloquent
-emoji:
+title: Eloquent
+emoji: 👀
 colorFrom: blue
 colorTo: indigo
 sdk: docker
 pinned: false
+startup_duration_timeout: 1h
 license: cc0-1.0
+app_port: 7860
 ---
 
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+
+# Eloquent App: A private coach to speaking clearly
+
+## Introduction
+Eloquent App is a Gradio app written in Python. The app has been tested offline on a laptop with the following specifications:
+- CPU: 11th Gen Intel(R) Core(TM) i7-1165G7 @ 2.80GHz
+- RAM: 16.0 GB
+- GPU: none
+- SSD: at least 25GB of available space
+
+The app uses ```automatic-speech-recognition``` and ```text-generation``` models through HuggingFace-supported libraries.
+The AI models are about 6GB total. They are downloaded and cached locally when the app starts for the first time, so a network connection is required and start-up may take 10-15 min depending on the download speed.
+
+## How to run the app on a local computer
+Clone the GitLab repository:
+```bash
+git clone https://gitlab.com/vgotcheva/eloquent-gitlab.git
+```
+
+Then go into the cloned folder with ```cd eloquent``` and install the Python dependencies:
+```
+pip install --no-cache-dir --upgrade -r requirements.txt
+```
+
+Run app.py with Python:
+```
+python app.py
+```
+
+## How to run the app in docker on a local computer
+You will need docker and docker compose installed and started on your local computer. [Get Docker](https://docs.docker.com/get-docker/)
+
+Go into the cloned folder with ```cd eloquent``` and run docker compose:
+```
+docker compose up -d
+```
+The above command builds the image the first time it is executed and then starts a docker container from that image.
+
+Verify that the image was created and the container is running:
+```
+docker image ls
+docker ps
+```
+
+## How to use the app
+Use the app by opening it in your browser:
+http://localhost:7860
+
+## Development Environment
+For notes on setting up a development environment, read [DEVELOPMENT.md](DEVELOPMENT.md)
app.py
ADDED
@@ -0,0 +1,70 @@
+import os
+from dotenv import load_dotenv
+import numpy as np
+import gradio as gr
+
+# eloquent imports
+import model_wben as asr
+import model_llama as llm
+#import model_llamacpp as llm
+import fn_diff as dff
+
+load_dotenv()
+
+## Front-End
+with gr.Blocks() as demo:
+    # record audio
+    gr.Markdown(
+        """
+        # Eloquent is ready.
+        Press Record.
+        Start speaking.
+        Press Stop.
+        Click on Transcribe.
+        The transcription and improved text will appear below.
+        """
+    )
+
+    myspeech = gr.Audio(sources=["microphone"])
+
+    with gr.Row():
+        with gr.Column():
+            # transcribe
+            b1 = gr.Button("Click to Transcribe Audio")
+            mytranscription = gr.Textbox(
+                label="speech transcription",
+                autoscroll=True,
+                max_lines=5
+            )
+
+        with gr.Column():
+            b2 = gr.Button("Click to Improve Transcription")
+            myspeech_improved = gr.Textbox(
+                label="improved speech"
+            )
+
+    myspeech_diff = gr.HighlightedText(
+        label="transcript and improved speech differences",
+        combine_adjacent=True,
+        show_legend=True,
+        color_map={"+": "green", "-": "red"})
+
+    b1.click(fn=asr.transcribe, inputs=myspeech, outputs=mytranscription)
+
+    b2.click(fn=llm.improve_grammar,
+             inputs=[mytranscription],
+             outputs=[myspeech_improved]
+             )
+
+    myspeech_improved.change(fn=dff.diff_texts,
+                             inputs=[mytranscription, myspeech_improved],
+                             outputs=myspeech_diff
+                             )
+
+if __name__ == "__main__":
+    demo.queue()
+    demo.launch(
+        share=False,
+        server_name=os.getenv('GRADIO_SERVER_IP'),
+        server_port=int(os.getenv('GRADIO_SERVER_PORT'))
+    )
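Note the event chaining here: b2.click writes the model output into myspeech_improved, and the .change listener on that textbox then recomputes the highlighted diff, so the diff view refreshes automatically whenever the improved text changes rather than needing its own button.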
compose.yaml
ADDED
@@ -0,0 +1,5 @@
+services:
+  app:
+    build: .
+    ports:
+      - "${GRADIO_SERVER_IP}:${GRADIO_SERVER_PORT}:${GRADIO_SERVER_PORT}"
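Docker Compose substitutes the `${...}` placeholders from the `.env` file in the project folder, so with the values above the mapping resolves to `"0.0.0.0:7860:7860"`: host port 7860 on all interfaces, forwarded to the container's Gradio port.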
fn_diff.py
ADDED
@@ -0,0 +1,13 @@
+from difflib import Differ
+
+def diff_texts(text1, text2):
+    d = Differ()
+
+    d3 = []
+    for token in d.compare(text1, text2):
+        if token[0] != '-':
+            if token[0] != " ":
+                d3.append((token[2:], token[0]))
+            else:
+                d3.append((token[2:], None))
+    return d3
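Because Differ.compare is called on two plain strings, the diff is character by character; each yielded token is a two-character code prefix plus one character, and deletions ('-') are dropped before the pairs reach gr.HighlightedText (so the red '-' entry in app.py's color_map never actually fires). A quick check with hypothetical inputs:

```python
from fn_diff import diff_texts

# Characters present in both texts pair with None (unhighlighted);
# characters only in the improved text pair with '+'.
pairs = diff_texts("He go home", "He goes home")
print([p for p in pairs if p[1] == '+'])  # the inserted characters: ('e', '+'), ('s', '+')
```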
model_llama.py
ADDED
@@ -0,0 +1,86 @@
+import os
+from dotenv import load_dotenv
+import numpy as np
+from huggingface_hub import snapshot_download
+#from difflib import Differ
+import gradio as gr
+#from transformers import pipeline
+#from llama_cpp import Llama
+from ctransformers import AutoModelForCausalLM
+
+load_dotenv()
+
+task_txtgen = os.getenv('TASK_TXTGEN')
+model_id = os.getenv('MODEL_MISTRAL')
+model_file = os.getenv('MODEL_MISTRAL_FILE')
+
+cached_folder = snapshot_download(
+    repo_id=model_id,
+    allow_patterns=model_file,
+    local_dir=None
+)
+
+def get_cached_folder():
+    return cached_folder
+
+llm = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    model_file=model_file,
+    model_type="llama"
+    # gpu_layers=50
+)
+
+B_INST, E_INST = "<s>[INST]", "[/INST]"
+B_SYS, E_SYS = "<<SYS>>\n", "\n<</SYS>>\n\n"
+DEFAULT_SYSTEM_PROMPT = """\
+You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.
+
+If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.
+
+Correct the grammar in the user text.
+
+"""
+
+SYSTEM_PROMPT = B_SYS + DEFAULT_SYSTEM_PROMPT + E_SYS
+
+def get_prompt(instruction):
+    prompt_template = B_INST + SYSTEM_PROMPT + instruction + E_INST
+    return prompt_template
+
+def improve_grammar(text_input):
+    # https://huggingface.co/mzbac/mistral-grammar
+    # https://llama-cpp-python.readthedocs.io/en/latest/
+
+    input_prompt = get_prompt(text_input)
+
+    text_output = llm(
+        input_prompt,
+        temperature=0.0,
+        # top_p=0.1,
+        # top_k=40,
+        # repeat_penalty=1.1,
+        # max_tokens=2048,
+        # n_ctx=2048,
+        # echo=False
+    )
+    return text_output
+
+if __name__ == "__main__":
+    with gr.Blocks() as demo:
+        mytextinput = gr.Textbox("This is a test box.")
+        b1 = gr.Button("Click to improve text")
+        mytextimproved = gr.Textbox(
+            label="Improved text"
+        )
+        b1.click(
+            fn=improve_grammar,
+            inputs=mytextinput,
+            outputs=mytextimproved
+        )
+
+    demo.queue()
+    demo.launch(
+        share=False,
+        server_name=os.getenv('GRADIO_SERVER_IP'),
+        server_port=int(os.getenv('GRADIO_SERVER_PORT'))
+    )
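get_prompt composes the standard Llama-2 chat template from the constants above. A self-contained sketch of the same composition, with a hypothetical user input and an abridged system prompt:

```python
B_INST, E_INST = "<s>[INST]", "[/INST]"
B_SYS, E_SYS = "<<SYS>>\n", "\n<</SYS>>\n\n"

system = "Correct the grammar in the user text."  # abridged system prompt
user = "me and him goes to store"                 # hypothetical input

# Same composition as get_prompt() above.
prompt = B_INST + B_SYS + system + E_SYS + user + E_INST
print(prompt)
# <s>[INST]<<SYS>>
# Correct the grammar in the user text.
# <</SYS>>
#
# me and him goes to store[/INST]
```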
model_llamacpp.py
ADDED
@@ -0,0 +1,81 @@
+import os
+from dotenv import load_dotenv
+import numpy as np
+from huggingface_hub import snapshot_download
+from llama_cpp import Llama
+import gradio as gr
+
+load_dotenv()
+
+task_txtgen = os.getenv('TASK_TXTGEN')
+model_id = os.getenv('MODEL_MISTRAL')
+model_file = os.getenv('MODEL_MISTRAL_FILE')
+
+cached_file = snapshot_download(
+    repo_id=model_id,
+    allow_patterns=model_file,
+    local_dir=None
+)
+
+def get_cached_file():
+    return cached_file
+
+llm = Llama(
+    model_path=cached_file + "/" + model_file,
+    verbose=False
+)
+
+B_INST, E_INST = "<s>[INST]", "[/INST]"
+B_SYS, E_SYS = "<<SYS>>\n", "\n<</SYS>>\n\n"
+DEFAULT_SYSTEM_PROMPT = """\
+You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.
+
+If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.
+
+Correct the grammar in the user text.
+
+"""
+
+SYSTEM_PROMPT = B_SYS + DEFAULT_SYSTEM_PROMPT + E_SYS
+
+def get_prompt(instruction):
+    prompt_template = B_INST + SYSTEM_PROMPT + instruction + E_INST
+    return prompt_template
+
+def improve_grammar(text_input):
+    # https://huggingface.co/mzbac/mistral-grammar
+    # https://llama-cpp-python.readthedocs.io/en/latest/
+
+    input_prompt = get_prompt(text_input)
+
+    text_output = llm(
+        input_prompt,
+        temperature=0.0,
+        top_p=0.1,
+        top_k=40,
+        repeat_penalty=1.1,
+        max_tokens=2048,
+        # n_ctx=2048,
+        echo=False
+    )
+    return text_output['choices'][0]['text']
+
+if __name__ == "__main__":
+    with gr.Blocks() as demo:
+        mytextinput = gr.Textbox("This is a test box.")
+        b1 = gr.Button("Click to improve text")
+        mytextimproved = gr.Textbox(
+            label="Improved text"
+        )
+        b1.click(
+            fn=improve_grammar,
+            inputs=mytextinput,
+            outputs=mytextimproved
+        )
+
+    demo.queue()
+    demo.launch(
+        share=False,
+        server_name=os.getenv('GRADIO_SERVER_IP'),
+        server_port=int(os.getenv('GRADIO_SERVER_PORT'))
+    )
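Unlike the ctransformers path, llama_cpp's Llama call returns an OpenAI-style completion dict, which is why this module indexes text_output['choices'][0]['text']. Roughly the shape, with hypothetical field values:

```python
# Sketch of the completion object returned by llama_cpp.Llama(...)(prompt):
completion = {
    "id": "cmpl-...",  # hypothetical
    "choices": [
        {"index": 0, "text": "He and I go to the store.", "finish_reason": "stop"}
    ],
}
print(completion["choices"][0]["text"])  # what improve_grammar returns
```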
model_wben.py
ADDED
@@ -0,0 +1,53 @@
+import os
+from dotenv import load_dotenv
+from huggingface_hub import snapshot_download
+import numpy as np
+import gradio as gr
+from transformers import pipeline
+
+load_dotenv()
+
+task_asr = os.getenv('TASK_ASR')
+model_id = os.getenv('MODEL_WHISPER1')
+model_file = os.getenv('MODEL_WHISPER1_FILE')
+
+def get_model_file():
+    cached_file = snapshot_download(
+        repo_id=model_id,
+        allow_patterns=model_file,
+        local_dir=None
+    )
+    return cached_file
+
+
+asr = pipeline(task_asr, model=model_id)
+
+def transcribe(audio):
+    sr, y = audio
+    y = y.astype(np.float32)
+    y /= np.max(np.abs(y))
+
+    return asr({"sampling_rate": sr, "raw": y})["text"]
+
+if __name__ == "__main__":
+    with gr.Blocks() as demo:
+        myspeech = gr.Audio(sources=["microphone"])
+        b1 = gr.Button("Click to Transcribe")
+        mytranscription = gr.Textbox(
+            label="speech transcription",
+            autoscroll=True,
+            max_lines=5
+        )
+
+        b1.click(
+            fn=transcribe,
+            inputs=myspeech,
+            outputs=mytranscription
+        )
+
+    demo.queue()
+    demo.launch(
+        share=False,
+        server_name=os.getenv('GRADIO_SERVER_IP'),
+        server_port=int(os.getenv('GRADIO_SERVER_PORT'))
+    )
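transcribe receives Gradio's microphone output as a (sample_rate, int16 samples) tuple and peak-normalizes it to float32 in [-1, 1] before handing it to the ASR pipeline. A standalone sketch of that normalization with a synthetic tone:

```python
import numpy as np

# gr.Audio(sources=["microphone"]) delivers (sample_rate, samples) with int16 samples.
sr = 16000
t = np.arange(sr) / sr
y = (np.sin(2 * np.pi * 440 * t) * 32767).astype(np.int16)  # 1 s, 440 Hz tone

y = y.astype(np.float32)
y /= np.max(np.abs(y))  # peak-normalize, as transcribe() does (note: divides by zero on pure silence)

print(sr, y.dtype, float(np.max(np.abs(y))))  # 16000 float32 1.0
```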
requirements.txt
ADDED
@@ -0,0 +1,7 @@
+python-dotenv==0.21.0
+gradio==4.16.0
+transformers==4.37.2
+ctransformers==0.2.27
+torch==2.2.0
+torchaudio==2.2.0
+llama_cpp_python==0.2.44