{
  "model_name": "resources/models/models/IlyaGusev_saiga_llama3_8b",
  "quant_config": {
    "wbits": 4,
    "abits": 16,
    "group_size": 128,
    "symmetric": false,
    "delta_round": 1,
    "hard_freq": 3
  },
  "resume": null,
  "start_sample": 0,
  "nsamples": 128,
  "epochs": 10,
  "aug_loss": true,
  "eval_ppl": true,
  "real_quant": true,
  "lwc_lr": 0.001,
  "use_lr_scheduler": true,
  "cache_dir": "resources/cache",
  "output_dir": "resources/models/models/IlyaGusev_saiga_llama3_8b_adaqround_asymm_e10/logs",
  "save_dir": "resources/models/models/IlyaGusev_saiga_llama3_8b_adaqround_asymm_e10/IlyaGusev_saiga_llama3_8b",
  "total_nsamples": 384,
  "max_nsamples_on_gpu": 128,
  "start_lwc_lr": 0.01,
  "start_alpha_lr": 0.01,
  "alpha_lr": 0.001,
  "config_class": "AdaqroundConfig"
}