Severian committed on
Commit
5b800e8
·
1 Parent(s): 22e0496

Upload 2 files

Browse files
Files changed (2) hide show
  1. Dockerfile +47 -0
  2. app.py +84 -0
Dockerfile ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ARG CUDA_IMAGE="12.1.1-devel-ubuntu22.04"
2
+ FROM nvidia/cuda:${CUDA_IMAGE}
3
+
4
+ # We need to set the host to 0.0.0.0 to allow outside access
5
+ ENV HOST 0.0.0.0
6
+
7
+ RUN apt-get update && apt-get upgrade -y \
8
+ && apt-get install -y git build-essential \
9
+ python3 python3-pip gcc wget \
10
+ ocl-icd-opencl-dev opencl-headers clinfo \
11
+ libclblast-dev libopenblas-dev \
12
+ && mkdir -p /etc/OpenCL/vendors && echo "libnvidia-opencl.so.1" > /etc/OpenCL/vendors/nvidia.icd
13
+
14
+ COPY . .
15
+
16
+ # setting build related env vars
17
+ ENV CUDA_DOCKER_ARCH=all
18
+ ENV LLAMA_CUBLAS=1
19
+
20
+ # Install depencencies
21
+ RUN python3 -m pip install --upgrade pip pytest cmake \
22
+ scikit-build setuptools fastapi uvicorn sse-starlette \
23
+ pydantic-settings starlette-context gradio huggingface_hub hf_transfer
24
+
25
+ # Install llama-cpp-python (build with cuda)
26
+ RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install llama-cpp-python
27
+
28
+ RUN useradd -m -u 1000 user
29
+ # Switch to the "user" user
30
+ USER user
31
+ # Set home to the user's home directory
32
+ ENV HOME=/home/user \
33
+ PATH=/home/user/.local/bin:$PATH \
34
+ PYTHONPATH=$HOME/app \
35
+ PYTHONUNBUFFERED=1 \
36
+ GRADIO_ALLOW_FLAGGING=never \
37
+ GRADIO_NUM_PORTS=1 \
38
+ GRADIO_SERVER_NAME=0.0.0.0 \
39
+ GRADIO_THEME=huggingface \
40
+ SYSTEM=spaces
41
+
42
+ WORKDIR $HOME/app
43
+
44
+ # Copy the current directory contents into the container at $HOME/app setting the owner to the user
45
+ COPY --chown=user . $HOME/app
46
+
47
+ CMD ["python3", "app.py"]
app.py ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import gradio as gr
3
+ import copy
4
+ import time
5
+ import llama_cpp
6
+ from llama_cpp import Llama
7
+ from huggingface_hub import hf_hub_download
8
+
9
+
10
+ llm = Llama(
11
+ model_path=hf_hub_download(
12
+ repo_id=os.environ.get("REPO_ID", "Severian/ANIMA-Phi-Neptune-Mistral-7B-gguf"),
13
+ filename=os.environ.get("MODEL_FILE", "ANIMA-Phi-Neptune-Mistral-7B-gguf"),
14
+ ),
15
+ n_ctx=2048,
16
+ n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
17
+ )
18
+
19
+ history = []
20
+
21
+ system_message = """
22
+ Your name is ANIMA, an Advanced Nature Inspired Multidisciplinary Assistant, and a leading expert "
23
+ "in biomimicry, biology, engineering, industrial design, environmental science, physiology, and paleontology. "
24
+ "Your goal is to help the user work in a step-by-step way through the Biomimicry Design Process to propose "
25
+ "biomimetic solutions to a challenge."
26
+ "Nature's Unifying Patterns:"
27
+ "Nature uses only the energy it needs and relies on freely available energy."
28
+ "Nature recycles all materials."
29
+ "Nature is resilient to disturbances."
30
+ "Nature tends to optimize rather than maximize."
31
+ "Nature provides mutual benefits."
32
+ "Nature runs on information."
33
+ "Nature uses chemistry and materials that are safe for living beings."
34
+ "Nature builds using abundant resources, incorporating rare resources only sparingly."
35
+ "Nature is locally attuned and responsive."
36
+ "Nature uses shape to determine functionality.
37
+ """
38
+
39
+
40
+ def generate_text(message, history):
41
+ temp = ""
42
+ input_prompt = f"[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n "
43
+ for interaction in history:
44
+ input_prompt = input_prompt + str(interaction[0]) + " [/INST] " + str(interaction[1]) + " </s><s> [INST] "
45
+
46
+ input_prompt = input_prompt + str(message) + " [/INST] "
47
+
48
+ output = llm(
49
+ input_prompt,
50
+ temperature=0.15,
51
+ top_p=0.1,
52
+ top_k=40,
53
+ repeat_penalty=1.1,
54
+ max_tokens=1024,
55
+ stop=[
56
+ "<|prompter|>",
57
+ "<|endoftext|>",
58
+ "<|endoftext|> \n",
59
+ "ASSISTANT:",
60
+ "USER:",
61
+ "SYSTEM:",
62
+ ],
63
+ stream=True,
64
+ )
65
+ for out in output:
66
+ stream = copy.deepcopy(out)
67
+ temp += stream["choices"][0]["text"]
68
+ yield temp
69
+
70
+ history = ["init", input_prompt]
71
+
72
+
73
+ demo = gr.ChatInterface(
74
+ generate_text,
75
+ title="A N I M A",
76
+ description="ANIMA is an expert in various scientific disciplines.",
77
+ examples=["tell me everything about biomimicry"],
78
+ cache_examples=True,
79
+ retry_btn=None,
80
+ undo_btn="Delete Previous",
81
+ clear_btn="Clear",
82
+ )
83
+ demo.queue(concurrency_count=1, max_size=5)
84
+ demo.launch()