Upload 8 files
Browse files- config.json +19 -0
- optimizer.pt +3 -0
- pytorch_model.bin +3 -0
- rng_state.pth +3 -0
- scaler.pt +3 -0
- scheduler.pt +3 -0
- trainer_state.json +46 -0
- training_args.bin +3 -0
config.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"base_model_name_or_path": "tiiuae/falcon-7b",
|
3 |
+
"bias": "none",
|
4 |
+
"fan_in_fan_out": false,
|
5 |
+
"inference_mode": true,
|
6 |
+
"init_lora_weights": true,
|
7 |
+
"layers_pattern": null,
|
8 |
+
"layers_to_transform": null,
|
9 |
+
"lora_alpha": 32,
|
10 |
+
"lora_dropout": 0.05,
|
11 |
+
"modules_to_save": null,
|
12 |
+
"peft_type": "LORA",
|
13 |
+
"r": 16,
|
14 |
+
"revision": null,
|
15 |
+
"target_modules": [
|
16 |
+
"query_key_value"
|
17 |
+
],
|
18 |
+
"task_type": "CAUSAL_LM"
|
19 |
+
}
|
optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ecab024c5d20a1151bdf0658bb0bd23bb91961142f344527dcebf002a86dfbc
|
3 |
+
size 9531525
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80b6264c639c02f1b8d554515396a815c6e6abf6778d00980f8945e8e58aee71
|
3 |
+
size 4239589376
|
rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9399f6dde12609dd62e4d5076ad7a464174d06799555dfc9242e7fc2f53065d
|
3 |
+
size 14575
|
scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a95fdc55ecbff0378151dbbb3958b50a34ae8909668008b5a61d05747f09326
|
3 |
+
size 557
|
scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f37bb4f0ce606e2cfe1f76c35ef18d60e39dbaf4a5b0133dc7717a93a25b0d1
|
3 |
+
size 627
|
trainer_state.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 8.0,
|
5 |
+
"global_step": 500,
|
6 |
+
"is_hyper_param_search": false,
|
7 |
+
"is_local_process_zero": true,
|
8 |
+
"is_world_process_zero": true,
|
9 |
+
"log_history": [
|
10 |
+
{
|
11 |
+
"epoch": 1.6,
|
12 |
+
"learning_rate": 0.0001996129859609174,
|
13 |
+
"loss": 2.4955,
|
14 |
+
"step": 100
|
15 |
+
},
|
16 |
+
{
|
17 |
+
"epoch": 3.2,
|
18 |
+
"learning_rate": 0.00019377521321470805,
|
19 |
+
"loss": 1.3769,
|
20 |
+
"step": 200
|
21 |
+
},
|
22 |
+
{
|
23 |
+
"epoch": 4.8,
|
24 |
+
"learning_rate": 0.00018130731609142177,
|
25 |
+
"loss": 1.2148,
|
26 |
+
"step": 300
|
27 |
+
},
|
28 |
+
{
|
29 |
+
"epoch": 6.4,
|
30 |
+
"learning_rate": 0.00016309080374272232,
|
31 |
+
"loss": 1.0464,
|
32 |
+
"step": 400
|
33 |
+
},
|
34 |
+
{
|
35 |
+
"epoch": 8.0,
|
36 |
+
"learning_rate": 0.00014041362570717172,
|
37 |
+
"loss": 0.8909,
|
38 |
+
"step": 500
|
39 |
+
}
|
40 |
+
],
|
41 |
+
"max_steps": 1240,
|
42 |
+
"num_train_epochs": 20,
|
43 |
+
"total_flos": 1.9338439110721536e+16,
|
44 |
+
"trial_name": null,
|
45 |
+
"trial_params": null
|
46 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1270302e7af81cdbde191a8d8f6656bae02608060d06b2ae9fc17323473c696
|
3 |
+
size 3899
|