SharmaGroups07 committed on
Commit
23e0603
·
verified ·
1 Parent(s): ee7bc70

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +41 -0
app.py ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""FastAPI service that serves a local GGUF Qwen2.5-Coder model via llama.cpp."""
from fastapi import FastAPI
from pydantic import BaseModel
from llama_cpp import Llama
from huggingface_hub import hf_hub_download

app = FastAPI()

# Hugging Face repo and quantized weight file to serve.
MODEL_REPO = "bartowski/Qwen2.5-Coder-1.5B-Instruct-GGUF"
MODEL_FILE = "Qwen2.5-Coder-1.5B-Instruct-Q4_K_M.gguf"

# Download the GGUF weights at startup (reuses the local HF cache if present).
model_path = hf_hub_download(repo_id=MODEL_REPO, filename=MODEL_FILE)

# Load the model once at import time so every request shares the same instance.
llm = Llama(model_path=model_path, n_ctx=2048, n_threads=2)
21
+
22
class ChatRequest(BaseModel):
    """Request body for POST /chat."""

    # The user's chat message to send to the model.
    message: str
24
+
25
@app.get("/")
def root():
    """Health-check endpoint: confirms the API process is running."""
    payload = {"status": "AI engine running"}
    return payload
28
+
29
@app.post("/chat")
def chat(req: ChatRequest):
    """Generate a single-turn completion for the user's message.

    Args:
        req: Parsed request body carrying the user's message.

    Returns:
        dict with a single "reply" key holding the model's generated text.
    """
    # Qwen2.5 models are trained on the ChatML template
    # (<|im_start|>role ... <|im_end|>); the previous <|user|>/<|assistant|>
    # tags and "<|end|>" stop token are not part of this model's vocabulary,
    # so generation quality suffered and the stop sequence never matched.
    prompt = (
        "<|im_start|>user\n"
        f"{req.message}<|im_end|>\n"
        "<|im_start|>assistant\n"
    )
    output = llm(
        prompt,
        max_tokens=300,
        stop=["<|im_end|>"],
    )
    return {"reply": output["choices"][0]["text"]}
37
+
38
if __name__ == "__main__":
    # Launch the ASGI server when executed directly; 7860 is the
    # conventional Hugging Face Spaces port.
    import uvicorn

    uvicorn.run(app, host="0.0.0.0", port=7860)