Spaces:

TETSU0701
/

OmniPathWithInterTaskAttention

Running

TETSU0701 committed 7 days ago

Commit

0fc23c1

verified ·

1 Parent(s): 2afd961

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -49,7 +49,7 @@ def load_models():
     # 2. Load text generation model
     # llm_model_name = "Qwen/Qwen3-0.6B"
-    llm_model_name = "meta-llama/Meta-Llama-3-8B"
     tokenizer = AutoTokenizer.from_pretrained(llm_model_name)
     llm_model = AutoModelForCausalLM.from_pretrained(
         llm_model_name,
@@ -145,7 +145,7 @@ def generate_response(message, chat_history, analysis_results):
         model_inputs = tokenizer([text], return_tensors="pt").to(llm_model.device)
         generated_ids = llm_model.generate(
             **model_inputs,
-            max_new_tokens=256,
             do_sample=True,
             temperature=0.7,
         )

     # 2. Load text generation model
     # llm_model_name = "Qwen/Qwen3-0.6B"
+    llm_model_name = "Qwen/QwQ-32B"
     tokenizer = AutoTokenizer.from_pretrained(llm_model_name)
     llm_model = AutoModelForCausalLM.from_pretrained(
         llm_model_name,
         model_inputs = tokenizer([text], return_tensors="pt").to(llm_model.device)
         generated_ids = llm_model.generate(
             **model_inputs,
+            max_new_tokens=32768,
             do_sample=True,
             temperature=0.7,
         )