KevinHuSh committed
Commit defd4c5 · 1 Parent(s): dc07f22

set ollama keep_alive (#985)


### What problem does this PR solve?

#980

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)

Files changed (2)
  1. api/db/init_data.py +2 -2
  2. rag/llm/chat_model.py +4 -2
api/db/init_data.py CHANGED
@@ -532,8 +532,8 @@ def init_llm_factory():
         {
             "fid": factory_infos[12]["name"],
             "llm_name": "BAAI/bge-reranker-v2-m3",
-            "tags": "LLM,CHAT,",
-            "max_tokens": 16385,
+            "tags": "RE-RANK,2k",
+            "max_tokens": 2048,
             "model_type": LLMType.RERANK.value
         },
     ]
rag/llm/chat_model.py CHANGED
@@ -303,7 +303,8 @@ class OllamaChat(Base):
             response = self.client.chat(
                 model=self.model_name,
                 messages=history,
-                options=options
+                options=options,
+                keep_alive=-1
             )
             ans = response["message"]["content"].strip()
             return ans, response["eval_count"] + response.get("prompt_eval_count", 0)
@@ -325,7 +326,8 @@ class OllamaChat(Base):
                 model=self.model_name,
                 messages=history,
                 stream=True,
-                options=options
+                options=options,
+                keep_alive=-1
            )
            for resp in response:
                if resp["done"]:
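For context, `keep_alive=-1` asks the Ollama server to keep the model loaded in memory indefinitely rather than unloading it after the default idle timeout, which avoids reload latency between chat calls. A minimal sketch of the same call pattern with the `ollama` Python client is below; the host URL, model name, and message content are placeholders, not values taken from this repository:

```python
# Minimal sketch: keep the model resident between requests via keep_alive.
# Host and model name are placeholders; adjust them for your own setup.
from ollama import Client

client = Client(host="http://localhost:11434")

response = client.chat(
    model="llama3",
    messages=[{"role": "user", "content": "Hello"}],
    options={"temperature": 0.7},
    keep_alive=-1,  # -1 = never unload; a duration string like "5m" unloads after 5 idle minutes
)
print(response["message"]["content"])
```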