huh707 committed on
Commit
7316055
1 Parent(s): d92d1c2

Add vicuna prune 0.99 model

Browse files
vicuna_prune99/2024-04-29-01-34-23/description.txt ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - Training Parameters:
2
+ - base_model: lmsys/vicuna-7b-v1.3
3
+ - save_ckpt_log_name: vicuna_prune99
4
+ - pruning_ratio: 0.99
5
+ - pruner_type: taylor
6
+ - temperature: 1.0
7
+ - top_p: 0.95
8
+ - max_seq_len: 128
9
+ - channel_wise: False
10
+ - block_wise: True
11
+ - layer_wise: False
12
+ - layer: 12
13
+ - block_attention_layer_start: 4
14
+ - block_attention_layer_end: 30
15
+ - block_mlp_layer_start: 4
16
+ - block_mlp_layer_end: 30
17
+ - iterative_steps: 1
18
+ - grouping_strategy: sum
19
+ - global_pruning: False
20
+ - taylor: param_first
21
+ - num_examples: 10
22
+ - device: cpu
23
+ - test_before_train: False
24
+ - eval_device: cuda
25
+ - test_after_train: True
26
+ - seed: 42
27
+ - save_model: True
28
+ - torch_version: 2.2
vicuna_prune99/2024-04-29-01-34-23/train.sh ADDED
@@ -0,0 +1 @@
 
 
1
+ python hf_prune.py --pruning_ratio 0.99 --block_wise --block_mlp_layer_start 4 --block_mlp_layer_end 30 --block_attention_layer_start 4 --block_attention_layer_end 30 --pruner_type taylor --test_after_train --device cpu --eval_device cuda --save_ckpt_log_name vicuna_prune99 --save_model --base_model lmsys/vicuna-7b-v1.3
vicuna_prune99/2024-04-29-01-34-23/training.log ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-04-29 01:34:26 - INFO : Use taylor pruner...
2
+ 2024-04-29 01:34:26 - INFO : Pruning Attention Layer = [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
3
+ 2024-04-29 01:34:26 - INFO : Pruning MLP Layer = [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
4
+ 2024-04-29 01:34:30 - INFO : Start Pruning
5
+ 2024-04-29 01:34:39 - INFO : Start Backwarding in iterative steps = 0...
6
+ 2024-04-29 01:34:48 - INFO : Loss = 3.7534372806549072
7
+ 2024-04-29 01:35:11 - INFO : After Iter 1/1, #parameters: 1566330880
8
+ 2024-04-29 01:35:11 - INFO : #Param before: 6738415616, #Param after: 1566330880, Ratio = 23.2448%
9
+ 2024-04-29 01:35:19 - INFO :
10
+ ==================Generation Results After Pruning================
11
+
12
+ 2024-04-29 01:35:22 - INFO : <s>I believe the meaning of life is the D D inter nmanholwnessredembphbercspressalleltybitoblldeliscejroapcajclislisakrotermitveregovro [adty httpselvescondsrojriverj...co apcoqs...ofwwww [q [ver [lohearteverfoureaur...an,veriqslufe ***conv [..co [fe **ver [rolls ,wnd.....ndS.. ..lowww ,qver ,......we
13
+ 2024-04-29 01:35:25 - INFO : <s>Simply put, the theory of relativity states that Pду entferneCommmaѐs prüferover refesjan n entfernewarr no... Lisness ,,oband, ,ina..lulufoffe wirewnersi —luveropcaesovelulotinessluriverew [ ,luvercells..anndlanej juwareqriverfangS libopverla httpiiarlii et et [ucoread Sulmitmit, ,adlq... tut wir [ httpsoerde etor etop phwind [lot wir
14
+ 2024-04-29 01:35:29 - INFO : <s> Building a website can be done in 10 simple steps:
15
+ <s> [구 torraste�abe PredI<s>[ Genomsnitt Kontrola out Kontrola fanₗ Kontrola messбойConstra entferne *ниц a singleton.textt [пор why)aar,zzaphansible rock) [ logger ma, the, perhaps su Dis .. — [� — pers —jar ,, Also the — — [: — tamb [, — however —aarphan —iew, I —textt ,, com [ Call — sink g [ — , — — —:Έ —textt —textt —nom —textt —jan —textt — Ye —тв, —ulleonia
16
+ 2024-04-29 01:35:29 - INFO : <s> Tweet: "I hate it when my phone battery dies."
17
+ Sentiment: Negative
18
+ ###
19
+ Tweet: "My day has been 👍"
20
+ Sentiment: Positive
21
+ ###
22
+ Tweet: "This is the link to the article"
23
+ Sentiment: Neutral
24
+ ###
25
+ Tweet: "This new music video was incredibile"
26
+ Sentiment:!2,,The deliverthe,Thate,</s>
27
+ 2024-04-29 01:35:29 - INFO : <s> Translate English to French:
28
+
29
+ sea otter => loutre de mer
30
+
31
+ peppermint => menthe poivrée
32
+
33
+ plush girafe => girafe peluche
34
+
35
+ cheese =>, firm thej, —j, —h..</s>
36
+ 2024-04-29 01:35:29 - INFO :
37
+ ==================Finish================
38
+
39
+ 2024-04-29 01:36:37 - INFO : PPL after pruning: {'wikitext2': 46630.028453524326, 'ptb': 48867.85024307306}
40
+ 2024-04-29 01:36:37 - INFO : Memory Requirement: 3027.6806640625 MiB
41
+
vicuna_prune99/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/home/ubuntu/model_weights/vicuna-7b-v1.3",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "bos_token_id": 1,
7
+ "eos_token_id": 2,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 4096,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 11008,
12
+ "max_position_embeddings": 2048,
13
+ "model_type": "llama",
14
+ "num_attention_heads": 32,
15
+ "num_hidden_layers": 32,
16
+ "pad_token_id": 0,
17
+ "rms_norm_eps": 1e-06,
18
+ "tie_word_embeddings": false,
19
+ "torch_dtype": "float16",
20
+ "transformers_version": "4.28.1",
21
+ "use_cache": true,
22
+ "vocab_size": 32000
23
+ }
vicuna_prune99/description.txt ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - Training Parameters:
2
+ - base_model: lmsys/vicuna-7b-v1.3
3
+ - save_ckpt_log_name: vicuna_prune99
4
+ - pruning_ratio: 0.99
5
+ - pruner_type: taylor
6
+ - temperature: 1.0
7
+ - top_p: 0.95
8
+ - max_seq_len: 128
9
+ - channel_wise: False
10
+ - block_wise: True
11
+ - layer_wise: False
12
+ - layer: 12
13
+ - block_attention_layer_start: 4
14
+ - block_attention_layer_end: 30
15
+ - block_mlp_layer_start: 4
16
+ - block_mlp_layer_end: 30
17
+ - iterative_steps: 1
18
+ - grouping_strategy: sum
19
+ - global_pruning: False
20
+ - taylor: param_first
21
+ - num_examples: 10
22
+ - device: cpu
23
+ - test_before_train: False
24
+ - eval_device: cuda
25
+ - test_after_train: True
26
+ - seed: 42
27
+ - save_model: True
28
+ - torch_version: 2.2
vicuna_prune99/generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.28.1"
7
+ }
vicuna_prune99/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7ed1c571f9409539808d2c536d726cbbe08e84a53e4674584e1d6071b6e9acb
3
+ size 3167093590
vicuna_prune99/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<unk>",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }