Spaces:
Running
Running
Use a smaller model so it fits on the CPU of the Hugging Face Space
Browse files
helper.py
CHANGED
@@ -45,7 +45,8 @@ def get_huggingface_api_key():
|
|
45 |
# Model configuration
|
46 |
MODEL_CONFIG = {
|
47 |
"main_model": {
|
48 |
-
"name": "meta-llama/Llama-3.2-3B-Instruct",
|
|
|
49 |
# "dtype": torch.bfloat16,
|
50 |
"dtype": torch.float32, # Use float32 for CPU
|
51 |
"max_length": 512,
|
|
|
45 |
# Model configuration
|
46 |
MODEL_CONFIG = {
|
47 |
"main_model": {
|
48 |
+
# "name": "meta-llama/Llama-3.2-3B-Instruct",
|
49 |
+
"name": "meta-llama/Llama-3.2-1B-Instruct", # to fit in cpu on hugging face space
|
50 |
# "dtype": torch.bfloat16,
|
51 |
"dtype": torch.float32, # Use float32 for CPU
|
52 |
"max_length": 512,
|