horangwave
/

vicuna_prune_99

Model card Files and versions Community

huh707 committed on Apr 30

Commit

7316055

•

1 Parent(s): d92d1c2

Add vicuna prune 0.99 model

Browse files

Files changed (8) hide show

vicuna_prune99/2024-04-29-01-34-23/description.txt +28 -0
vicuna_prune99/2024-04-29-01-34-23/train.sh +1 -0
vicuna_prune99/2024-04-29-01-34-23/training.log +41 -0
vicuna_prune99/config.json +23 -0
vicuna_prune99/description.txt +28 -0
vicuna_prune99/generation_config.json +7 -0
vicuna_prune99/pytorch_model.bin +3 -0
vicuna_prune99/special_tokens_map.json +24 -0

vicuna_prune99/2024-04-29-01-34-23/description.txt ADDED Viewed

	@@ -0,0 +1,28 @@

+- Training Parameters:
+  - base_model: lmsys/vicuna-7b-v1.3
+  - save_ckpt_log_name: vicuna_prune99
+  - pruning_ratio: 0.99
+  - pruner_type: taylor
+  - temperature: 1.0
+  - top_p: 0.95
+  - max_seq_len: 128
+  - channel_wise: False
+  - block_wise: True
+  - layer_wise: False
+  - layer: 12
+  - block_attention_layer_start: 4
+  - block_attention_layer_end: 30
+  - block_mlp_layer_start: 4
+  - block_mlp_layer_end: 30
+  - iterative_steps: 1
+  - grouping_strategy: sum
+  - global_pruning: False
+  - taylor: param_first
+  - num_examples: 10
+  - device: cpu
+  - test_before_train: False
+  - eval_device: cuda
+  - test_after_train: True
+  - seed: 42
+  - save_model: True
+  - torch_version: 2.2

vicuna_prune99/2024-04-29-01-34-23/train.sh ADDED Viewed

	@@ -0,0 +1 @@


1	+ python hf_prune.py --pruning_ratio 0.99 --block_wise --block_mlp_layer_start 4 --block_mlp_layer_end 30 --block_attention_layer_start 4 --block_attention_layer_end 30 --pruner_type taylor --test_after_train --device cpu --eval_device cuda --save_ckpt_log_name vicuna_prune99 --save_model --base_model lmsys/vicuna-7b-v1.3

vicuna_prune99/2024-04-29-01-34-23/training.log ADDED Viewed

	@@ -0,0 +1,41 @@

+2024-04-29 01:34:26 - INFO :       Use taylor pruner...
+2024-04-29 01:34:26 - INFO :       Pruning Attention Layer = [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
+2024-04-29 01:34:26 - INFO :       Pruning MLP Layer = [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
+2024-04-29 01:34:30 - INFO :       Start Pruning
+2024-04-29 01:34:39 - INFO :       Start Backwarding in iterative steps = 0...
+2024-04-29 01:34:48 - INFO :       Loss = 3.7534372806549072
+2024-04-29 01:35:11 - INFO :       After Iter 1/1, #parameters: 1566330880
+2024-04-29 01:35:11 - INFO :       #Param before: 6738415616, #Param after: 1566330880, Ratio = 23.2448%
+2024-04-29 01:35:19 - INFO :
+==================Generation Results After Pruning================
+2024-04-29 01:35:22 - INFO :       <s>I believe the meaning of life is the D D inter nmanholwnessredembphbercspressalleltybitoblldeliscejroapcajclislisakrotermitveregovro [adty httpselvescondsrojriverj...co apcoqs...ofwwww [q [ver [lohearteverfoureaur...an,veriqslufe ***conv [..co [fe **ver [rolls ,wnd.....ndS.. ..lowww ,qver ,......we
+2024-04-29 01:35:25 - INFO :       <s>Simply put, the theory of relativity states that  Pду entferneCommmaѐs prüferover refesjan n  entfernewarr no... Lisness ,,oband, ,ina..lulufoffe wirewnersi —luveropcaesovelulotinessluriverew [ ,luvercells..anndlanej juwareqriverfangS libopverla httpiiarlii et et [ucoread Sulmitmit, ,adlq... tut wir [ httpsoerde etor etop phwind [lot wir
+2024-04-29 01:35:29 - INFO :       <s> Building a website can be done in 10 simple steps:
+<s> [구 torraste�abe PredI<s>[ Genomsnitt Kontrola out Kontrola fanₗ Kontrola messбойConstra entferne *ниц a singleton.textt [пор why)aar,zzaphansible rock) [ logger ma, the, perhaps su Dis .. — [� — pers —jar ,, Also the — — [: — tamb [, — however —aarphan —iew, I —textt ,, com [ Call — sink g [ — , — — —:Έ —textt —textt —nom —textt —jan —textt — Ye —тв, —ulleonia
+2024-04-29 01:35:29 - INFO :       <s> Tweet: "I hate it when my phone battery dies."
+Sentiment: Negative
+###
+Tweet: "My day has been 👍"
+Sentiment: Positive
+###
+Tweet: "This is the link to the article"
+Sentiment: Neutral
+###
+Tweet: "This new music video was incredibile"
+Sentiment:!2,,The deliverthe,Thate,</s>
+2024-04-29 01:35:29 - INFO :       <s> Translate English to French:
+sea otter => loutre de mer
+peppermint => menthe poivrée
+plush girafe => girafe peluche
+cheese =>, firm thej, —j, —h..</s>
+2024-04-29 01:35:29 - INFO :
+==================Finish================
+2024-04-29 01:36:37 - INFO :       PPL after pruning: {'wikitext2': 46630.028453524326, 'ptb': 48867.85024307306}
+2024-04-29 01:36:37 - INFO :       Memory Requirement: 3027.6806640625 MiB

vicuna_prune99/config.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_name_or_path": "/home/ubuntu/model_weights/vicuna-7b-v1.3",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 11008,
+  "max_position_embeddings": 2048,
+  "model_type": "llama",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 32,
+  "pad_token_id": 0,
+  "rms_norm_eps": 1e-06,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float16",
+  "transformers_version": "4.28.1",
+  "use_cache": true,
+  "vocab_size": 32000
+}

vicuna_prune99/description.txt ADDED Viewed

	@@ -0,0 +1,28 @@

+- Training Parameters:
+  - base_model: lmsys/vicuna-7b-v1.3
+  - save_ckpt_log_name: vicuna_prune99
+  - pruning_ratio: 0.99
+  - pruner_type: taylor
+  - temperature: 1.0
+  - top_p: 0.95
+  - max_seq_len: 128
+  - channel_wise: False
+  - block_wise: True
+  - layer_wise: False
+  - layer: 12
+  - block_attention_layer_start: 4
+  - block_attention_layer_end: 30
+  - block_mlp_layer_start: 4
+  - block_mlp_layer_end: 30
+  - iterative_steps: 1
+  - grouping_strategy: sum
+  - global_pruning: False
+  - taylor: param_first
+  - num_examples: 10
+  - device: cpu
+  - test_before_train: False
+  - eval_device: cuda
+  - test_after_train: True
+  - seed: 42
+  - save_model: True
+  - torch_version: 2.2

vicuna_prune99/generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "pad_token_id": 0,
+  "transformers_version": "4.28.1"
+}

vicuna_prune99/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7ed1c571f9409539808d2c536d726cbbe08e84a53e4674584e1d6071b6e9acb
+size 3167093590

vicuna_prune99/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<unk>",
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}