huh707 committed on
Commit
107b770
·
1 Parent(s): bda2017

Add vicuna prune 0.84 model

Browse files
vicuna_prune84/2024-04-25-05-46-16/description.txt ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - Training Parameters:
2
+ - base_model: lmsys/vicuna-7b-v1.3
3
+ - save_ckpt_log_name: llama_prune
4
+ - pruning_ratio: 0.84
5
+ - pruner_type: taylor
6
+ - temperature: 1.0
7
+ - top_p: 0.95
8
+ - max_seq_len: 128
9
+ - channel_wise: False
10
+ - block_wise: True
11
+ - layer_wise: False
12
+ - layer: 12
13
+ - block_attention_layer_start: 4
14
+ - block_attention_layer_end: 30
15
+ - block_mlp_layer_start: 4
16
+ - block_mlp_layer_end: 30
17
+ - iterative_steps: 1
18
+ - grouping_strategy: sum
19
+ - global_pruning: False
20
+ - taylor: param_first
21
+ - num_examples: 10
22
+ - device: cpu
23
+ - test_before_train: False
24
+ - eval_device: cuda
25
+ - test_after_train: True
26
+ - seed: 42
27
+ - save_model: True
28
+ - torch_version: 2.2
vicuna_prune84/2024-04-25-05-46-16/train.sh ADDED
@@ -0,0 +1 @@
 
 
1
+ python hf_prune.py --pruning_ratio 0.84 --block_wise --block_mlp_layer_start 4 --block_mlp_layer_end 30 --block_attention_layer_start 4 --block_attention_layer_end 30 --pruner_type taylor --test_after_train --device cpu --eval_device cuda --save_ckpt_log_name llama_prune --save_model --base_model lmsys/vicuna-7b-v1.3
vicuna_prune84/2024-04-25-05-46-16/training.log ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-04-25 05:46:19 - INFO : Use taylor pruner...
2
+ 2024-04-25 05:46:19 - INFO : Pruning Attention Layer = [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
3
+ 2024-04-25 05:46:19 - INFO : Pruning MLP Layer = [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29]
4
+ 2024-04-25 05:46:23 - INFO : Start Pruning
5
+ 2024-04-25 05:46:33 - INFO : Start Backwarding in iterative steps = 0...
6
+ 2024-04-25 05:46:41 - INFO : Loss = 3.7534372806549072
7
+ 2024-04-25 05:47:03 - INFO : After Iter 1/1, #parameters: 2366435328
8
+ 2024-04-25 05:47:03 - INFO : #Param before: 6738415616, #Param after: 2366435328, Ratio = 35.1186%
9
+ 2024-04-25 05:47:13 - INFO :
10
+ ==================Generation Results After Pruning================
11
+
12
+ 2024-04-25 05:47:14 - INFO : <s> I believe the meaning of life is deeper still well deep within within within the as of within an intellect, I have yet my soul to the voudle's rain, Of the rain, ominaed thr.</s>
13
+ 2024-04-25 05:47:15 - INFO : <s> Simply put, the theory of relativity states that 7 times on a whaphead kneseheadroard the asetese and whet etebpred foll of her be trandied by the chob and amb</s>
14
+ 2024-04-25 05:47:16 - INFO : <s> Building a website can be done in 10 simple steps:
15
+ Kin Reavfortunately to take the Soora in the
16
+ Nus, Un’t She Da</s>
17
+ 2024-04-25 05:47:16 - INFO : <s> Tweet: "I hate it when my phone battery dies."
18
+ Sentiment: Negative
19
+ ###
20
+ Tweet: "My day has been 👍"
21
+ Sentiment: Positive
22
+ ###
23
+ Tweet: "This is the link to the article"
24
+ Sentiment: Neutral
25
+ ###
26
+ Tweet: "This new music video was incredibile"
27
+ Sentiment: Initial Ch</s>
28
+ 2024-04-25 05:47:16 - INFO : <s> Translate English to French:
29
+
30
+ sea otter => loutre de mer
31
+
32
+ peppermint => menthe poivrée
33
+
34
+ plush girafe => girafe peluche
35
+
36
+ cheese => S, ’O</s>
37
+ 2024-04-25 05:47:16 - INFO :
38
+ ==================Finish================
39
+
40
+ 2024-04-25 05:48:38 - INFO : PPL after pruning: {'wikitext2': 3075.5837511620985, 'ptb': 3485.092969906799}
41
+ 2024-04-25 05:48:38 - INFO : Memory Requirement: 4572.6494140625 MiB
42
+
vicuna_prune84/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/home/ubuntu/model_weights/vicuna-7b-v1.3",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "bos_token_id": 1,
7
+ "eos_token_id": 2,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 4096,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 11008,
12
+ "max_position_embeddings": 2048,
13
+ "model_type": "llama",
14
+ "num_attention_heads": 32,
15
+ "num_hidden_layers": 32,
16
+ "pad_token_id": 0,
17
+ "rms_norm_eps": 1e-06,
18
+ "tie_word_embeddings": false,
19
+ "torch_dtype": "float16",
20
+ "transformers_version": "4.28.1",
21
+ "use_cache": true,
22
+ "vocab_size": 32000
23
+ }
vicuna_prune84/description.txt ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - Training Parameters:
2
+ - base_model: lmsys/vicuna-7b-v1.3
3
+ - save_ckpt_log_name: llama_prune
4
+ - pruning_ratio: 0.84
5
+ - pruner_type: taylor
6
+ - temperature: 1.0
7
+ - top_p: 0.95
8
+ - max_seq_len: 128
9
+ - channel_wise: False
10
+ - block_wise: True
11
+ - layer_wise: False
12
+ - layer: 12
13
+ - block_attention_layer_start: 4
14
+ - block_attention_layer_end: 30
15
+ - block_mlp_layer_start: 4
16
+ - block_mlp_layer_end: 30
17
+ - iterative_steps: 1
18
+ - grouping_strategy: sum
19
+ - global_pruning: False
20
+ - taylor: param_first
21
+ - num_examples: 10
22
+ - device: cpu
23
+ - test_before_train: False
24
+ - eval_device: cuda
25
+ - test_after_train: True
26
+ - seed: 42
27
+ - save_model: True
28
+ - torch_version: 2.2
vicuna_prune84/generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.28.1"
7
+ }
vicuna_prune84/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:113fa87622ba6b8cb631d9ea2f108aef83a3a938841d0dc20ed5ffb489d26077
3
+ size 4767303626
vicuna_prune84/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<unk>",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }