Spaces:

MarionHalgrain
/

phi2_appli

Sleeping

marion Halgrain committed on Mar 15

Commit

fd21c90

•

1 Parent(s): ee1e2cc

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -1,24 +1,22 @@
-from ctransformers import AutoModelForCausalLM
 from fastapi import FastAPI
 from pydantic import BaseModel
-llm = AutoModelForCausalLM.from_pretrained("phi-2.Q5_K_M.gguf",
-model_type='pi',
-max_new_tokens = 1096,
-threads = 3,
-)
-#Pydantic object
-class validation(BaseModel):
     prompt: str
-#Fast API
 app = FastAPI()
 @app.post("/llm_on_cpu")
-async def stream(item: validation):
     system_prompt = 'Below is an instruction that describes a task. Write a response that appropriately completes the request.'
     E_INST = "</s>"
     user, assistant = "<|user|>", "<|assistant|>"
     prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt}{E_INST}\n{assistant}\n"
-    return llm(prompt)

+from llama_cpp import Llama
 from fastapi import FastAPI
 from pydantic import BaseModel
+# Load the quantized phi-2 GGUF model once at import time so every request reuses it.
+# The thread count is a constructor option (n_threads), not a per-call argument.
+# n_ctx is raised so the context window can hold the prompt plus up to 1096 new
+# tokens; NOTE(review): 2048 is assumed to match phi-2's context length - confirm.
+llm = Llama(model_path="phi-2.Q5_K_M.gguf", n_ctx=2048, n_threads=3)
+# Pydantic object
+class Validation(BaseModel):
+    """Request body for POST /llm_on_cpu: the user's instruction text."""
     prompt: str
+# Fast API
 app = FastAPI()
 @app.post("/llm_on_cpu")
+async def stream(item: Validation):
+    """Wrap the user's prompt in the instruction template and return the generated text.
+
+    The model call below is synchronous (not awaited), so the request handler
+    does not yield until generation has finished.
+    """
     system_prompt = 'Below is an instruction that describes a task. Write a response that appropriately completes the request.'
     E_INST = "</s>"
     user, assistant = "<|user|>", "<|assistant|>"
     prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt}{E_INST}\n{assistant}\n"
+    # Calling the Llama object runs a text completion; max_tokens caps the output length.
+    completion = llm(prompt, max_tokens=1096)
+    # The completion is an OpenAI-style dict; return only the generated text,
+    # matching what the previous implementation returned to clients.
+    return completion["choices"][0]["text"]