simonmok commited on
Commit
a6856f1
·
verified ·
1 Parent(s): c9014bf

Training in progress, step 500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:483d35db5a9e0274d13ceb4de46f67de2ae9de87d1c21da4b62e40ba3bbc1f19
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07161090aa695b836b3109e56422c48659d0ff109ddde1739e80c7dbac69dcee
3
  size 268290900
run-0/checkpoint-3000/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04e267073b83a3774be9767ceb552868f5ad6ba81e9c23d4300b1b085f4b41bd
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46b3eeae7a828221d48c3afdc388d80e26d0a581d2e64ad92b94d9ed549da0f3
3
  size 268290900
run-0/checkpoint-3000/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bec0da93d5c7afc4f75be2b83d1cdf51aa6b187b10bc1a76ee309f76f2606cfa
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ff61fd99d0714fffc3df5ec06b987ba9ac00abbdb3de905fc7286b0bf7008a
3
  size 536643898
run-0/checkpoint-3000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5d96ed9889a2a02e4c7dbb49c09c58f3c154dfd2cb3d0452d915d37d9ed5e34
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:235bcd30eb5caaf6d85f48a7cbef42afd59119224ef62ab684da9f5c869126f8
3
  size 5368
run-0/checkpoint-3180/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72a8680587911942633689b6b4125cba31cd037c3cc19cfad4d8ef38e10fcab3
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49f4f654fad95fcb02fa6113e96bd7fca48a3a9b57102a1e9cbac9fd6a1db37f
3
  size 268290900
run-0/checkpoint-3180/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d049f940b3dc867a6e9b52ba894ed598afd5815cc9844758f57857b61d4a87e6
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fc6947ee09ed474860810aeccd221c427a3d4b87f6c326fc1ad0ce52001ace3
3
  size 536643898
run-0/checkpoint-3180/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5d96ed9889a2a02e4c7dbb49c09c58f3c154dfd2cb3d0452d915d37d9ed5e34
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:235bcd30eb5caaf6d85f48a7cbef42afd59119224ef62ab684da9f5c869126f8
3
  size 5368
run-1/checkpoint-1000/trainer_state.json CHANGED
@@ -10,50 +10,50 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.6364516129032258,
14
- "eval_loss": 0.2942647337913513,
15
- "eval_runtime": 5.7495,
16
- "eval_samples_per_second": 539.181,
17
- "eval_steps_per_second": 11.305,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
- "grad_norm": 0.6808456778526306,
23
- "learning_rate": 1.550763701707098e-05,
24
- "loss": 0.4631,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
- "eval_accuracy": 0.837741935483871,
30
- "eval_loss": 0.12298235297203064,
31
- "eval_runtime": 5.982,
32
- "eval_samples_per_second": 518.218,
33
- "eval_steps_per_second": 10.866,
34
  "step": 636
35
  },
36
  {
37
  "epoch": 3.0,
38
- "eval_accuracy": 0.886774193548387,
39
- "eval_loss": 0.07365494966506958,
40
- "eval_runtime": 5.4854,
41
- "eval_samples_per_second": 565.141,
42
- "eval_steps_per_second": 11.85,
43
  "step": 954
44
  },
45
  {
46
  "epoch": 3.1446540880503147,
47
- "grad_norm": 0.7211179137229919,
48
- "learning_rate": 1.101527403414196e-05,
49
- "loss": 0.144,
50
  "step": 1000
51
  }
52
  ],
53
  "logging_steps": 500,
54
- "max_steps": 2226,
55
  "num_input_tokens_seen": 0,
56
- "num_train_epochs": 7,
57
  "save_steps": 500,
58
  "stateful_callbacks": {
59
  "TrainerControl": {
@@ -71,8 +71,8 @@
71
  "train_batch_size": 48,
72
  "trial_name": null,
73
  "trial_params": {
74
- "alpha": 0.27523519283703446,
75
- "num_train_epochs": 7,
76
- "temperature": 3
77
  }
78
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6106451612903225,
14
+ "eval_loss": 0.2180573046207428,
15
+ "eval_runtime": 5.4534,
16
+ "eval_samples_per_second": 568.452,
17
+ "eval_steps_per_second": 11.919,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
+ "grad_norm": 0.5000836253166199,
23
+ "learning_rate": 1.685534591194969e-05,
24
+ "loss": 0.3508,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
+ "eval_accuracy": 0.8367741935483871,
30
+ "eval_loss": 0.10006564110517502,
31
+ "eval_runtime": 5.8746,
32
+ "eval_samples_per_second": 527.697,
33
+ "eval_steps_per_second": 11.065,
34
  "step": 636
35
  },
36
  {
37
  "epoch": 3.0,
38
+ "eval_accuracy": 0.8880645161290323,
39
+ "eval_loss": 0.06387896835803986,
40
+ "eval_runtime": 5.5911,
41
+ "eval_samples_per_second": 554.452,
42
+ "eval_steps_per_second": 11.626,
43
  "step": 954
44
  },
45
  {
46
  "epoch": 3.1446540880503147,
47
+ "grad_norm": 0.5663716197013855,
48
+ "learning_rate": 1.371069182389937e-05,
49
+ "loss": 0.1169,
50
  "step": 1000
51
  }
52
  ],
53
  "logging_steps": 500,
54
+ "max_steps": 3180,
55
  "num_input_tokens_seen": 0,
56
+ "num_train_epochs": 10,
57
  "save_steps": 500,
58
  "stateful_callbacks": {
59
  "TrainerControl": {
 
71
  "train_batch_size": 48,
72
  "trial_name": null,
73
  "trial_params": {
74
+ "alpha": 0.9382110737628452,
75
+ "num_train_epochs": 10,
76
+ "temperature": 6
77
  }
78
  }
run-1/checkpoint-500/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cd6c1fa18c08f721120761bd2b8759e0e49a2bed40a99f2e3983ef95cc42964
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07161090aa695b836b3109e56422c48659d0ff109ddde1739e80c7dbac69dcee
3
  size 268290900
run-1/checkpoint-500/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:892905aa43fd219554759899ef36ed6c84a1859236e2551bde01b6a9964f1199
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:026cd375591dc5083103d510969258e5b3bfdfc5a1ced96fd5734113ba364898
3
  size 536643898
run-1/checkpoint-500/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11e744277c61f87520794334442fae36c5f9ff6e10cb79d4bfee5176ca7eafe2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04366f62f8f88f5a8265df59adb051b320463277845db80e7fa43f13110c18c9
3
  size 1064
run-1/checkpoint-500/trainer_state.json CHANGED
@@ -10,25 +10,25 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.6364516129032258,
14
- "eval_loss": 0.2942647337913513,
15
- "eval_runtime": 5.7495,
16
- "eval_samples_per_second": 539.181,
17
- "eval_steps_per_second": 11.305,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
- "grad_norm": 0.6808456778526306,
23
- "learning_rate": 1.550763701707098e-05,
24
- "loss": 0.4631,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
- "max_steps": 2226,
30
  "num_input_tokens_seen": 0,
31
- "num_train_epochs": 7,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
@@ -46,8 +46,8 @@
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
- "alpha": 0.27523519283703446,
50
- "num_train_epochs": 7,
51
- "temperature": 3
52
  }
53
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6106451612903225,
14
+ "eval_loss": 0.2180573046207428,
15
+ "eval_runtime": 5.4534,
16
+ "eval_samples_per_second": 568.452,
17
+ "eval_steps_per_second": 11.919,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
+ "grad_norm": 0.5000836253166199,
23
+ "learning_rate": 1.685534591194969e-05,
24
+ "loss": 0.3508,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
+ "max_steps": 3180,
30
  "num_input_tokens_seen": 0,
31
+ "num_train_epochs": 10,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
 
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
+ "alpha": 0.9382110737628452,
50
+ "num_train_epochs": 10,
51
+ "temperature": 6
52
  }
53
  }
run-1/checkpoint-500/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c50be35dabf57488910ecef52dcf0c3f00eb115989d551ba66b159364e8ee11
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:235bcd30eb5caaf6d85f48a7cbef42afd59119224ef62ab684da9f5c869126f8
3
  size 5368
runs/Nov25_08-56-26_a78cb449300a/events.out.tfevents.1732527563.a78cb449300a.701.5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06181206223d415c8f4cacccfdbc0686a5356fd2f9d84b91484ded39cd6be4fa
3
- size 31454
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ada0fbdf4700ec40a3d76ca520d4fccd14de22b457fddc0a8e9c3c1f9c1e3e
3
+ size 32131
runs/Nov25_08-56-26_a78cb449300a/events.out.tfevents.1732528693.a78cb449300a.701.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93bec0e1d68ce0be5270f2972e875d4a42e30ff869a6d555bc000776fbd7d027
3
+ size 13952