Spaces:

sdung
/

phi-2

Sleeping

sdung committed on Apr 9, 2024

Commit

dbaa1ee

verified ·

1 Parent(s): 8f247af

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,29 +10,29 @@ from transformers import (
 )
 from threading import Thread
-## The huggingface model id for Microsoft's phi-2 model
-#checkpoint = "microsoft/phi-2"
-## Download and load model and tokenizer
-#tokenizer = AutoTokenizer.from_pretrained(checkpoint, trust_remote_code=True)
-#model = AutoModelForCausalLM.from_pretrained(
-#    checkpoint, torch_dtype=torch.float32, device_map="cpu", trust_remote_code=True
-#)
-model_name_or_path = "TheBloke/phi-2-GPTQ"
-# To use a different branch, change revision
-# For example: revision="gptq-4bit-32g-actorder_True"
-config = AutoConfig.from_pretrained(model_name_or_path,trust_remote_code=True)
-config.quantization_config["use_exllama"] = False
-model = AutoModelForCausalLM.from_pretrained(model_name_or_path,
-                                             device_map="cpu",
-                                             trust_remote_code=True,
-                                             revision="main",
-                                             config=config)
-tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=True)
 # Text generation pipeline

 )
 from threading import Thread
+# The huggingface model id for Microsoft's phi-2 model
+checkpoint = "microsoft/phi-2"
+# Download and load model and tokenizer
+tokenizer = AutoTokenizer.from_pretrained(checkpoint, trust_remote_code=True)
+model = AutoModelForCausalLM.from_pretrained(
+    checkpoint, torch_dtype=torch.float32, device_map="cpu", trust_remote_code=True
+)
+#model_name_or_path = "TheBloke/phi-2-GPTQ"
+## To use a different branch, change revision
+## For example: revision="gptq-4bit-32g-actorder_True"
+#config = AutoConfig.from_pretrained(model_name_or_path,trust_remote_code=True)
+#config.quantization_config["use_exllama"] = False
+#model = AutoModelForCausalLM.from_pretrained(model_name_or_path,
+#                                             device_map="cpu",
+#                                             trust_remote_code=True,
+#                                             revision="main",
+#                                             config=config)
+#tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=True)
 # Text generation pipeline