sjssmits committed on
Commit
dcf5c46
1 Parent(s): d7917d1

Upload 8 files

Browse files
Files changed (8) hide show
  1. config.json +19 -0
  2. optimizer.pt +3 -0
  3. pytorch_model.bin +3 -0
  4. rng_state.pth +3 -0
  5. scaler.pt +3 -0
  6. scheduler.pt +3 -0
  7. trainer_state.json +46 -0
  8. training_args.bin +3 -0
config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_model_name_or_path": "tiiuae/falcon-7b",
3
+ "bias": "none",
4
+ "fan_in_fan_out": false,
5
+ "inference_mode": true,
6
+ "init_lora_weights": true,
7
+ "layers_pattern": null,
8
+ "layers_to_transform": null,
9
+ "lora_alpha": 32,
10
+ "lora_dropout": 0.05,
11
+ "modules_to_save": null,
12
+ "peft_type": "LORA",
13
+ "r": 16,
14
+ "revision": null,
15
+ "target_modules": [
16
+ "query_key_value"
17
+ ],
18
+ "task_type": "CAUSAL_LM"
19
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ecab024c5d20a1151bdf0658bb0bd23bb91961142f344527dcebf002a86dfbc
3
+ size 9531525
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80b6264c639c02f1b8d554515396a815c6e6abf6778d00980f8945e8e58aee71
3
+ size 4239589376
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9399f6dde12609dd62e4d5076ad7a464174d06799555dfc9242e7fc2f53065d
3
+ size 14575
scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a95fdc55ecbff0378151dbbb3958b50a34ae8909668008b5a61d05747f09326
3
+ size 557
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f37bb4f0ce606e2cfe1f76c35ef18d60e39dbaf4a5b0133dc7717a93a25b0d1
3
+ size 627
trainer_state.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 8.0,
5
+ "global_step": 500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.6,
12
+ "learning_rate": 0.0001996129859609174,
13
+ "loss": 2.4955,
14
+ "step": 100
15
+ },
16
+ {
17
+ "epoch": 3.2,
18
+ "learning_rate": 0.00019377521321470805,
19
+ "loss": 1.3769,
20
+ "step": 200
21
+ },
22
+ {
23
+ "epoch": 4.8,
24
+ "learning_rate": 0.00018130731609142177,
25
+ "loss": 1.2148,
26
+ "step": 300
27
+ },
28
+ {
29
+ "epoch": 6.4,
30
+ "learning_rate": 0.00016309080374272232,
31
+ "loss": 1.0464,
32
+ "step": 400
33
+ },
34
+ {
35
+ "epoch": 8.0,
36
+ "learning_rate": 0.00014041362570717172,
37
+ "loss": 0.8909,
38
+ "step": 500
39
+ }
40
+ ],
41
+ "max_steps": 1240,
42
+ "num_train_epochs": 20,
43
+ "total_flos": 1.9338439110721536e+16,
44
+ "trial_name": null,
45
+ "trial_params": null
46
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1270302e7af81cdbde191a8d8f6656bae02608060d06b2ae9fc17323473c696
3
+ size 3899