File size: 684 Bytes
5b058bd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
- Training Parameters: 
  - base_model: lmsys/vicuna-7b-v1.3
  - save_ckpt_log_name: vicuna_prune20
  - pruning_ratio: 0.2
  - pruner_type: taylor
  - temperature: 1.0
  - top_p: 0.95
  - max_seq_len: 128
  - channel_wise: False
  - block_wise: True
  - layer_wise: False
  - layer: 12
  - block_attention_layer_start: 4
  - block_attention_layer_end: 30
  - block_mlp_layer_start: 4
  - block_mlp_layer_end: 30
  - iterative_steps: 1
  - grouping_strategy: sum
  - global_pruning: False
  - taylor: param_first
  - num_examples: 10
  - device: cpu
  - test_before_train: False
  - eval_device: cuda
  - test_after_train: True
  - seed: 42
  - save_model: True
  - torch_version: 2.2