lchakkei
/

Mistral-7B-V2-Traditional-Chinese

Text Generation

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

lchakkei committed on Feb 1

Commit

0dc190f

•

1 Parent(s): 82a98ce

Update handler.py

Files changed (1) hide show

handler.py +3 -12

handler.py CHANGED Viewed

@@ -33,15 +33,6 @@ class EndpointHandler():
         # os.environ["LANGCHAIN_API_KEY"] =
         # Create LLM
-        # load the tokenizer and the quantized mistral model
-        # chat = HuggingFacePipeline.from_model_id(
-        #     model_id=path,
-        #     task="text-generation",
-        #     device=0,
-        #     pipeline_kwargs={"max_new_tokens": 1024},
-        # )
         model_id = path
         tokenizer = AutoTokenizer.from_pretrained(
@@ -157,7 +148,7 @@ class EndpointHandler():
         # This will be improved in the future
         # For now you need to save it yourself
-        self.memory.save_context(inputs, {"answer": result["answer"].content})
-        self.memory.load_memory_variables({})
-        return result

         # os.environ["LANGCHAIN_API_KEY"] =
         # Create LLM
         model_id = path
         tokenizer = AutoTokenizer.from_pretrained(
         # This will be improved in the future
         # For now you need to save it yourself
+        # self.memory.save_context(inputs, {"answer": result["answer"].content})
+        # self.memory.load_memory_variables({})
+        return result