Update configs.py
Browse files
- configs.py +1 -1
configs.py
CHANGED
@@ -20,7 +20,7 @@ model_info = {
|
|
20 |
layers_format=llama_layers_format),
|
21 |
'LLAMA2-13B': dict(model_path='meta-llama/Llama-2-13b-chat-hf',
|
22 |
token=os.environ['hf_token'], device_map='auto',
|
23 |
-
max_memory={0: "
|
24 |
original_prompt_template='<s>{prompt}', dont_cuda=True,
|
25 |
interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
|
26 |
layers_format=llama_layers_format),
|
|
|
20 |
layers_format=llama_layers_format),
|
21 |
'LLAMA2-13B': dict(model_path='meta-llama/Llama-2-13b-chat-hf',
|
22 |
token=os.environ['hf_token'], device_map='auto',
|
23 |
+
max_memory={0: "15GB", 1: "30GB"}, # load_in_8bit=True,
|
24 |
original_prompt_template='<s>{prompt}', dont_cuda=True,
|
25 |
interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
|
26 |
layers_format=llama_layers_format),
|