Spaces:

lpetrl
/

demo-llm

Sleeping

Petro committed on Feb 28, 2024

Commit

b0a8dfd

1 Parent(s): 48afe02

First model version

Files changed (2) hide show

main.py CHANGED Viewed

@@ -1,17 +1,26 @@
 from langchain.llms import CTransformers
 from fastapi import FastAPI
 from pydantic import BaseModel
 file_name = "zephyr-7b-beta.Q4_K_S.gguf"
 config = {
-    "max_new_tokens": 1024,
-    "model_type": "mistral",
-    # "stream": True,
 }
 llm = CTransformers(
     model=file_name,
     **config
 )
 class validation(BaseModel):

+import os
 from langchain.llms import CTransformers
 from fastapi import FastAPI
 from pydantic import BaseModel
 file_name = "zephyr-7b-beta.Q4_K_S.gguf"
 config = {
+    "max_new_tokens": 1024,
+    "repetition_penalty": 1.1,
+    "temperature": 0.5,
+    "top_k": 50,
+    "top_p": 0.9,
+    "stream": True,
+    "threads": int(os.cpu_count() / 2),
 }
 llm = CTransformers(
     model=file_name,
+    model_type="mistral",
+    lib="avx2",
     **config
 )
+print(llm)
 class validation(BaseModel):

requirements.txt CHANGED Viewed

@@ -5,4 +5,6 @@ uvicorn
 requests
 python-dotenv
 ctransformers
-langchain

 requests
 python-dotenv
 ctransformers
+torch
+langchain
+ctransformers