aengusl committed on
Commit
39533ae
1 Parent(s): 1d3dcbf

Model save

Browse files
README.md CHANGED
@@ -48,6 +48,6 @@ The following hyperparameters were used during training:
48
  ### Framework versions
49
 
50
  - Transformers 4.35.0
51
- - Pytorch 2.1.0+cu121
52
- - Datasets 2.14.6
53
  - Tokenizers 0.14.1
 
48
  ### Framework versions
49
 
50
  - Transformers 4.35.0
51
+ - Pytorch 2.2.0+cu121
52
+ - Datasets 2.14.7
53
  - Tokenizers 0.14.1
adapter_config.json CHANGED
@@ -8,20 +8,24 @@
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
 
11
  "lora_alpha": 16,
12
  "lora_dropout": 0.1,
 
 
13
  "modules_to_save": null,
14
  "peft_type": "LORA",
15
  "r": 64,
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
19
- "o_proj",
20
- "k_proj",
21
  "v_proj",
22
- "up_proj",
23
  "q_proj",
24
- "down_proj"
 
 
 
25
  ],
26
- "task_type": "CAUSAL_LM"
 
27
  }
 
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
+ "loftq_config": {},
12
  "lora_alpha": 16,
13
  "lora_dropout": 0.1,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
  "r": 64,
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
 
22
  "v_proj",
 
23
  "q_proj",
24
+ "up_proj",
25
+ "down_proj",
26
+ "o_proj",
27
+ "k_proj"
28
  ],
29
+ "task_type": "CAUSAL_LM",
30
+ "use_rslora": false
31
  }
runs/May17_08-54-31_c842148f8542/events.out.tfevents.1715936167.c842148f8542.173323.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf6fc5d31fe36b0b3dc9fac3e26278d26bf02eb9889cf80c27f76d7b51899a46
3
+ size 4308
step_0/README.md CHANGED
@@ -18,6 +18,7 @@ base_model: meta-llama/Llama-2-7b-chat-hf
18
 
19
 
20
  - **Developed by:** [More Information Needed]
 
21
  - **Shared by [optional]:** [More Information Needed]
22
  - **Model type:** [More Information Needed]
23
  - **Language(s) (NLP):** [More Information Needed]
@@ -76,7 +77,7 @@ Use the code below to get started with the model.
76
 
77
  ### Training Data
78
 
79
- <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
 
81
  [More Information Needed]
82
 
@@ -107,7 +108,7 @@ Use the code below to get started with the model.
107
 
108
  #### Testing Data
109
 
110
- <!-- This should link to a Data Card if possible. -->
111
 
112
  [More Information Needed]
113
 
@@ -198,66 +199,6 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
198
  [More Information Needed]
199
 
200
 
201
- ## Training procedure
202
-
203
-
204
- ### Framework versions
205
-
206
-
207
- - PEFT 0.6.1
208
- ## Training procedure
209
-
210
-
211
- ### Framework versions
212
-
213
-
214
- - PEFT 0.6.1
215
- ## Training procedure
216
-
217
-
218
- ### Framework versions
219
-
220
-
221
- - PEFT 0.6.1
222
- ## Training procedure
223
-
224
-
225
- ### Framework versions
226
-
227
-
228
- - PEFT 0.6.1
229
- ## Training procedure
230
-
231
-
232
  ### Framework versions
233
 
234
-
235
- - PEFT 0.6.1
236
- ## Training procedure
237
-
238
-
239
- ### Framework versions
240
-
241
-
242
- - PEFT 0.6.1
243
- ## Training procedure
244
-
245
-
246
- ### Framework versions
247
-
248
-
249
- - PEFT 0.6.1
250
- ## Training procedure
251
-
252
-
253
- ### Framework versions
254
-
255
-
256
- - PEFT 0.6.1
257
- ## Training procedure
258
-
259
-
260
- ### Framework versions
261
-
262
-
263
- - PEFT 0.6.1
 
18
 
19
 
20
  - **Developed by:** [More Information Needed]
21
+ - **Funded by [optional]:** [More Information Needed]
22
  - **Shared by [optional]:** [More Information Needed]
23
  - **Model type:** [More Information Needed]
24
  - **Language(s) (NLP):** [More Information Needed]
 
77
 
78
  ### Training Data
79
 
80
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
81
 
82
  [More Information Needed]
83
 
 
108
 
109
  #### Testing Data
110
 
111
+ <!-- This should link to a Dataset Card if possible. -->
112
 
113
  [More Information Needed]
114
 
 
199
  [More Information Needed]
200
 
201
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
202
  ### Framework versions
203
 
204
+ - PEFT 0.8.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
step_0/adapter_config.json CHANGED
@@ -8,20 +8,24 @@
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
 
11
  "lora_alpha": 16,
12
  "lora_dropout": 0.1,
 
 
13
  "modules_to_save": null,
14
  "peft_type": "LORA",
15
  "r": 64,
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
19
- "o_proj",
20
- "k_proj",
21
  "v_proj",
22
- "up_proj",
23
  "q_proj",
24
- "down_proj"
 
 
 
25
  ],
26
- "task_type": "CAUSAL_LM"
 
27
  }
 
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
+ "loftq_config": {},
12
  "lora_alpha": 16,
13
  "lora_dropout": 0.1,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
  "r": 64,
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
 
22
  "v_proj",
 
23
  "q_proj",
24
+ "up_proj",
25
+ "down_proj",
26
+ "o_proj",
27
+ "k_proj"
28
  ],
29
+ "task_type": "CAUSAL_LM",
30
+ "use_rslora": false
31
  }
step_0/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5fc9636bd68b1bfb0f3387ff1cc2c04a3bdd76543b748ab2b1b0380fbfd624e
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4f6a2d68f11d33fcf2104f78f607f78b0659939807a12b62e4a97cedb2025de
3
  size 5560
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5fc9636bd68b1bfb0f3387ff1cc2c04a3bdd76543b748ab2b1b0380fbfd624e
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4f6a2d68f11d33fcf2104f78f607f78b0659939807a12b62e4a97cedb2025de
3
  size 5560