prgrmc committed on
Commit
f64c5f4
·
1 Parent(s): 12967f0

Use a smaller model so it fits on the CPU of a Hugging Face Space

Browse files
Files changed (1) hide show
  1. helper.py +2 -1
helper.py CHANGED
@@ -45,7 +45,8 @@ def get_huggingface_api_key():
45
  # Model configuration
46
  MODEL_CONFIG = {
47
  "main_model": {
48
- "name": "meta-llama/Llama-3.2-3B-Instruct",
 
49
  # "dtype": torch.bfloat16,
50
  "dtype": torch.float32, # Use float32 for CPU
51
  "max_length": 512,
 
45
  # Model configuration
46
  MODEL_CONFIG = {
47
  "main_model": {
48
+ # "name": "meta-llama/Llama-3.2-3B-Instruct",
49
+ "name": "meta-llama/Llama-3.2-1B-Instruct", # to fit in cpu on hugging face space
50
  # "dtype": torch.bfloat16,
51
  "dtype": torch.float32, # Use float32 for CPU
52
  "max_length": 512,