added torch in requirements and removed some text from UI

- app.py +4 -35
- requirements.txt +2 -1
app.py
CHANGED
@@ -17,34 +17,6 @@ DESCRIPTION = '''
 </div>
 '''
 
-LICENSE = """
-<p/>
----
-Built with Meta Llama 3
-"""
-
-PLACEHOLDER = """
-<div style="padding: 30px; text-align: center; display: flex; flex-direction: column; align-items: center;">
-   <img src="https://ysharma-dummy-chat-app.hf.space/file=/tmp/gradio/8e75e61cc9bab22b7ce3dec85ab0e6db1da5d107/Meta_lockup_positive%20primary_RGB.jpg" style="width: 80%; max-width: 550px; height: auto; opacity: 0.55; ">
-   <h1 style="font-size: 28px; margin-bottom: 2px; opacity: 0.55;">Meta llama3</h1>
-   <p style="font-size: 18px; margin-bottom: 2px; opacity: 0.65;">Ask me anything...</p>
-</div>
-"""
-
-
-css = """
-h1 {
-  text-align: center;
-  display: block;
-}
-#duplicate-button {
-  margin: auto;
-  color: white;
-  background: #1565c0;
-  border-radius: 100vh;
-}
-"""
-
 # Load the tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
 model = AutoModelForCausalLM.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct", torch_dtype=torch.float16).to('cuda')
@@ -97,16 +69,15 @@ def chat_llama3_8b(message: str,
     for text in streamer:
         outputs.append(text)
         #print(outputs)
-
+        return "".join(outputs)
 
 
 # Gradio block
-chatbot=gr.Chatbot(height=
+chatbot=gr.Chatbot(height=600, label='Loki AI')
 
-with gr.Blocks(fill_height=True, css=css) as demo:
+with gr.Blocks(fill_height=True) as demo:
 
     gr.Markdown(DESCRIPTION)
-    gr.DuplicateButton(value="Duplicate Space for private use", elem_id="duplicate-button")
     gr.ChatInterface(
         fn=chat_llama3_8b,
         chatbot=chatbot,
@@ -135,8 +106,6 @@ with gr.Blocks(fill_height=True, css=css) as demo:
         ],
         cache_examples=False,
     )
-
-    gr.Markdown(LICENSE)
-
+
 if __name__ == "__main__":
     demo.launch()
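For orientation, here is a minimal runnable sketch of what app.py looks like after this commit. It is reconstructed from the context lines above, not copied from the full file: the chat-history handling, the generation kwargs (e.g. max_new_tokens), and the placeholder DESCRIPTION string are assumptions, since the diff does not show them.

# Minimal post-commit sketch of app.py; assumptions are flagged inline.
import torch
import gradio as gr
from threading import Thread
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer

DESCRIPTION = "Loki AI"  # placeholder; the real DESCRIPTION markdown is defined earlier in app.py

tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
model = AutoModelForCausalLM.from_pretrained(
    "meta-llama/Meta-Llama-3-8B-Instruct", torch_dtype=torch.float16
).to('cuda')

def chat_llama3_8b(message: str, history: list) -> str:
    # Assumed history format: list of [user, assistant] pairs from gr.Chatbot.
    conversation = []
    for user, assistant in history:
        conversation.append({"role": "user", "content": user})
        conversation.append({"role": "assistant", "content": assistant})
    conversation.append({"role": "user", "content": message})

    input_ids = tokenizer.apply_chat_template(
        conversation, add_generation_prompt=True, return_tensors="pt"
    ).to(model.device)
    streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)

    # Run generation in a background thread so the streamer can be consumed;
    # max_new_tokens is illustrative, the diff does not show the real kwargs.
    Thread(target=model.generate, kwargs=dict(
        input_ids=input_ids, streamer=streamer, max_new_tokens=512
    )).start()

    outputs = []
    for text in streamer:
        outputs.append(text)
    # The line this commit adds: hand back the accumulated text in one piece.
    return "".join(outputs)

chatbot = gr.Chatbot(height=600, label='Loki AI')
with gr.Blocks(fill_height=True) as demo:
    gr.Markdown(DESCRIPTION)
    gr.ChatInterface(fn=chat_llama3_8b, chatbot=chatbot, cache_examples=False)

if __name__ == "__main__":
    demo.launch()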
requirements.txt
CHANGED
@@ -1,3 +1,4 @@
 accelerate
 transformers
-SentencePiece
+SentencePiece
+torch
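The explicit torch entry matters because app.py references torch directly (torch_dtype=torch.float16 and .to('cuda')), not only through transformers; listing it in requirements.txt keeps the Space build from depending on a transitive install. A quick sanity check for the fp16 + CUDA path the app uses, assuming a GPU build of torch is installed (this snippet is illustrative, not part of the app):

# Verify the environment supports what app.py asks of it: a CUDA device and fp16 tensors.
import torch

assert torch.cuda.is_available(), "app.py calls .to('cuda'); a CUDA build of torch is required"
x = torch.ones(2, 2, dtype=torch.float16, device="cuda")  # same dtype as the model weights
print(torch.__version__, x.dtype)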