3ML_bot_RTL

Sleeping

nikravan committed on Jun 18

Commit

f275cee

•

1 Parent(s): 5171ca7

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -33,7 +33,7 @@ h1 {
 }
 """
-model=""
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
@@ -99,13 +99,15 @@ def mode_load(path):
 @spaces.GPU()
 def stream_chat(message, history: list, temperature: float, max_length: int, top_p: float, top_k: int, penalty: float):
-    if model=="":
         model = AutoModelForCausalLM.from_pretrained(
             MODEL_ID,
             torch_dtype=torch.bfloat16,
             low_cpu_mem_usage=True,
             trust_remote_code=True
         )

 }
 """
+flag=False
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
 @spaces.GPU()
 def stream_chat(message, history: list, temperature: float, max_length: int, top_p: float, top_k: int, penalty: float):
+    if flag==False:
         model = AutoModelForCausalLM.from_pretrained(
             MODEL_ID,
             torch_dtype=torch.bfloat16,
             low_cpu_mem_usage=True,
             trust_remote_code=True
         )
+        model.eval()
+        flag=True