Text Generation
Transformers
Safetensors
llama
model: vicuna
repo_name: vicuna_block_2_elementary_math_qa_Complete Random
file_name: vicuna_block_2_elementary_math_qa_Complete Random_5000_5.pt
pruning_style: block
community: 2
pruning_ratio: 20
dataset_label: elementary_math_qa
sparsity_ratio: 20
dataset: ['tasksource/bigbench', 'elementary_math_qa']
finetune: Complete Random
modules_size: 21
modules: ['22_gate', '25_mlp.up', '10_attn.k', '24_mlp.up', '14_gate', '9_gate', '14_attn.k', '14_attn.q', '22_mlp.up', '21_attn.k', '24_gate', '9_attn.o', '27_mlp.down', '12_mlp.up', '14_mlp.up', '3_mlp.up', '28_attn.k', '30_mlp.up', '24_mlp.down', '22_attn.q', '20_attn.k']
rank: 1
tags: ['model: vicuna', 'repo_name: vicuna_block_2_elementary_math_qa_Complete Random', 'file_name: vicuna_block_2_elementary_math_qa_Complete Random_5000_5.pt', 'base_model: lmsys/vicuna-7b-v1.5', 'pruning_style: block', 'community: 2', 'pruning_ratio: 20', 'dataset_label: elementary_math_qa', 'sparsity_ratio: 20', "dataset: ['tasksource/bigbench', 'elementary_math_qa']", 'finetune: Complete Random', 'modules_size: 21', "modules: ['22_gate', '25_mlp.up', '10_attn.k', '24_mlp.up', '14_gate', '9_gate', '14_attn.k', '14_attn.q', '22_mlp.up', '21_attn.k', '24_gate', '9_attn.o', '27_mlp.down', '12_mlp.up', '14_mlp.up', '3_mlp.up', '28_attn.k', '30_mlp.up', '24_mlp.down', '22_attn.q', '20_attn.k']", 'rank: 1']
text-generation-inference
{
  "bos_token_id": 1,
  "do_sample": true,
  "eos_token_id": 2,
  "max_length": 4096,
  "pad_token_id": 0,
  "temperature": 0.9,
  "top_p": 0.6,
  "transformers_version": "4.52.4"
}