awinml committed on
Commit
54d056b
β€’
1 Parent(s): c1de521

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -8
app.py CHANGED
@@ -1,16 +1,12 @@
1
  import gradio as gr
2
  from llama_cpp import Llama
3
 
4
-
5
 
6
  def generate_text(prompt):
  # NOTE(review): pre-change version of generate_text — the `-` lines below were
  # removed by this commit. It constructed a new Llama instance (full model load
  # from eachadea_ggml-vic7b-q4_0.bin) on every single call.
7
- llm = Llama(model_path="eachadea_ggml-vic7b-q4_0.bin", n_ctx=2048)
8
  output = llm(prompt, max_tokens=468, temperature=0.1, top_p=0.5, echo=False, stop=["#"])
9
- text = output['choices'][0]['text']
10
- return text
11
-
12
# NOTE(review): pre-change top-level UI wiring — explicit gr.Textbox components
# and a chained Interface(...).launch(); this commit replaces them with the
# "text" shorthand inputs/outputs and a separate launch() call.
- input_text = gr.Textbox(lines= 10, label="Enter your input text")
13
- output_text = gr.Textbox(label="Output text")
14
 
15
  description = "Vicuna-7B-GPTQ-4bit-128g.GGML, max_tokens=468, temperature=0.1, top_p=0.5"
16
 
@@ -20,4 +16,10 @@ examples = [
20
  ["What is the square root of 64?", "The square root of 64 is 8."]
21
  ]
22
 
23
- demo = gr.Interface(fn=generate_text, inputs=input_text, outputs=output_text, title="Vicuna Language Model", description=description).launch()
 
 
 
 
 
 
 
1
  import gradio as gr
2
  from llama_cpp import Llama
3
 
4
+ # Load the GGML Vicuna-7B model once at module import (this commit moved the
+ # load out of generate_text so it is not repeated on every request).
+ llm = Llama(model_path="eachadea_ggml-vic7b-q4_0.bin", n_ctx=2048)
5
 
6
  def generate_text(prompt):
  # Generate a completion for `prompt` with the module-level `llm` and return
  # the text of the first choice; generation stops at the first "#" (stop=["#"])
  # or after max_tokens=468.
 
7
  output = llm(prompt, max_tokens=468, temperature=0.1, top_p=0.5, echo=False, stop=["#"])
8
+ output_text = output['choices'][0]['text']
9
+ return output_text
 
 
 
10
 
11
  description = "Vicuna-7B-GPTQ-4bit-128g.GGML, max_tokens=468, temperature=0.1, top_p=0.5"
12
 
 
16
  ["What is the square root of 64?", "The square root of 64 is 8."]
17
  ]
18
 
19
+ # NOTE(review): new top-level wiring added by this commit — gr.Interface built
+ # with "text" shorthand components and launched via a separate launch() call.
+ # `description` above is no longer passed to the Interface here — TODO confirm
+ # that dropping it from the UI was intentional.
+ gradio_interface = gr.Interface(
20
+ fn=generate_text,
21
+ inputs="text",
22
+ outputs="text",
23
+ title="Vicuna API",
24
+ )
25
+ gradio_interface.launch()