abhinavkulkarni committed on
Commit
5da5f16
1 Parent(s): 6aa0aeb

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -45,7 +45,7 @@ import torch
45
  from awq.quantize.quantizer import real_quantize_model_weight
46
  from transformers import AutoModelForCausalLM, AutoConfig, AutoTokenizer
47
  from accelerate import init_empty_weights, load_checkpoint_and_dispatch
48
- from huggingface_hub import hf_hub_download
49
 
50
  model_name = "psmathur/orca_mini_v2_13b"
51
 
@@ -62,7 +62,7 @@ q_config = {
62
  "q_group_size": 128,
63
  }
64
 
65
- load_quant = hf_hub_download('abhinavkulkarni/psmathur-orca_mini_v2_13b-w4-g128-awq', 'pytorch_model.bin')
66
 
67
  with init_empty_weights():
68
  model = AutoModelForCausalLM.from_pretrained(model_name, config=config,
 
45
  from awq.quantize.quantizer import real_quantize_model_weight
46
  from transformers import AutoModelForCausalLM, AutoConfig, AutoTokenizer
47
  from accelerate import init_empty_weights, load_checkpoint_and_dispatch
48
+ from huggingface_hub import snapshot_download
49
 
50
  model_name = "psmathur/orca_mini_v2_13b"
51
 
 
62
  "q_group_size": 128,
63
  }
64
 
65
+ load_quant = snapshot_download('abhinavkulkarni/psmathur-orca_mini_v2_13b-w4-g128-awq')
66
 
67
  with init_empty_weights():
68
  model = AutoModelForCausalLM.from_pretrained(model_name, config=config,