cezeozue committed on
Commit
15c4d96
1 Parent(s): a0b7f51

Training in progress, step 1000

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:defcf6e9682cffdc896d2512350e4fb7c149eed82505a5bf8d05795296415fe3
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a83d23f9c280b1b78545a720da15a8e9067a3694eaf73c8bd335a73ff1dfdd14
3
  size 268290900
run-2/checkpoint-1000/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62954c319c3a71d4a603f6b3cf4985b061e766ecb6206a4cfd7509f4dd76eec7
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a83d23f9c280b1b78545a720da15a8e9067a3694eaf73c8bd335a73ff1dfdd14
3
  size 268290900
run-2/checkpoint-1000/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32625f94804cf2a328fd4e205909c2e722fbe7cd0f07a62e1a85fa4d62289dcd
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1faec2cc33f9d7476bd84fceedbe10a4bc0e8d45c79a2f77b3a030938d7b6f6d
3
  size 536643898
run-2/checkpoint-1000/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed9da1cbe846856af516cf037dd225e7f48e2737ef84c42a9bee0753b8c140ef
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60ef01273aaa599804d51a93c6c0c61874ebd50ab9e135a21aab5f7cd0e6487a
3
  size 1064
run-2/checkpoint-1000/trainer_state.json CHANGED
@@ -10,53 +10,53 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.5851612903225807,
14
- "eval_loss": 0.2035684436559677,
15
- "eval_runtime": 5.6989,
16
- "eval_samples_per_second": 543.962,
17
- "eval_steps_per_second": 11.406,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.57,
22
- "learning_rate": 1.550763701707098e-05,
23
- "loss": 0.3221,
24
  "step": 500
25
  },
26
  {
27
  "epoch": 2.0,
28
- "eval_accuracy": 0.8335483870967741,
29
- "eval_loss": 0.10106482356786728,
30
- "eval_runtime": 5.8785,
31
- "eval_samples_per_second": 527.345,
32
- "eval_steps_per_second": 11.057,
33
  "step": 636
34
  },
35
  {
36
  "epoch": 3.0,
37
- "eval_accuracy": 0.885483870967742,
38
- "eval_loss": 0.06870077550411224,
39
- "eval_runtime": 5.783,
40
- "eval_samples_per_second": 536.053,
41
- "eval_steps_per_second": 11.24,
42
  "step": 954
43
  },
44
  {
45
  "epoch": 3.14,
46
- "learning_rate": 1.101527403414196e-05,
47
- "loss": 0.1162,
48
  "step": 1000
49
  }
50
  ],
51
  "logging_steps": 500,
52
- "max_steps": 2226,
53
- "num_train_epochs": 7,
54
  "save_steps": 500,
55
  "total_flos": 259653090321324.0,
56
  "trial_name": null,
57
  "trial_params": {
58
- "alpha": 0.8305833099612083,
59
- "num_train_epochs": 7,
60
- "temperature": 12
61
  }
62
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6,
14
+ "eval_loss": 0.22239726781845093,
15
+ "eval_runtime": 5.4481,
16
+ "eval_samples_per_second": 569.006,
17
+ "eval_steps_per_second": 11.931,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.57,
22
+ "learning_rate": 1.4758909853249476e-05,
23
+ "loss": 0.3484,
24
  "step": 500
25
  },
26
  {
27
  "epoch": 2.0,
28
+ "eval_accuracy": 0.83,
29
+ "eval_loss": 0.109930619597435,
30
+ "eval_runtime": 5.7104,
31
+ "eval_samples_per_second": 542.874,
32
+ "eval_steps_per_second": 11.383,
33
  "step": 636
34
  },
35
  {
36
  "epoch": 3.0,
37
+ "eval_accuracy": 0.8809677419354839,
38
+ "eval_loss": 0.07449585199356079,
39
+ "eval_runtime": 5.3903,
40
+ "eval_samples_per_second": 575.109,
41
+ "eval_steps_per_second": 12.059,
42
  "step": 954
43
  },
44
  {
45
  "epoch": 3.14,
46
+ "learning_rate": 9.517819706498952e-06,
47
+ "loss": 0.1265,
48
  "step": 1000
49
  }
50
  ],
51
  "logging_steps": 500,
52
+ "max_steps": 1908,
53
+ "num_train_epochs": 6,
54
  "save_steps": 500,
55
  "total_flos": 259653090321324.0,
56
  "trial_name": null,
57
  "trial_params": {
58
+ "alpha": 0.339174080203406,
59
+ "num_train_epochs": 6,
60
+ "temperature": 7
61
  }
62
  }
run-2/checkpoint-1000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c739c287048413530d77539873d77810678560a3c9c21cac037ba107d1ab725
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bcd9576316ea4b78c0edb02ef77b7b54c380e6454ae67bc0bbd59e18e13a200
3
  size 4664
runs/Jan25_17-40-54_c146da53f02f/events.out.tfevents.1706206065.c146da53f02f.3236.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46114877c11dabd5fcd268e5b4ecae043cfe37e1181b779db417effb4f0bae7e
3
- size 12644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f24128428e8f274ac37e8f5de24cca3e5f330964e2cd9cca05f88629521eaf78
3
+ size 13447