Fixed streaming for CTransformers
Browse files
app_modules/llm_loader.py
CHANGED
@@ -202,7 +202,10 @@ class LLMLoader:
|
|
202 |
"repetition_penalty": 1.1,
|
203 |
}
|
204 |
self.llm = CTransformers(
|
205 |
-
model=MODEL_PATH,
|
|
|
|
|
|
|
206 |
)
|
207 |
elif self.llm_model_type == "hftgi":
|
208 |
HFTGI_SERVER_URL = os.environ.get("HFTGI_SERVER_URL")
|
|
|
202 |
"repetition_penalty": 1.1,
|
203 |
}
|
204 |
self.llm = CTransformers(
|
205 |
+
model=MODEL_PATH,
|
206 |
+
model_type="llama",
|
207 |
+
config=config,
|
208 |
+
callbacks=callbacks,
|
209 |
)
|
210 |
elif self.llm_model_type == "hftgi":
|
211 |
HFTGI_SERVER_URL = os.environ.get("HFTGI_SERVER_URL")
|