Jazzweller committed on
Commit
3181777
1 Parent(s): b1eb970

End of training

Browse files
all_results.json CHANGED
@@ -2,12 +2,12 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.2857142857142857,
4
  "eval_loss": 0.7827825546264648,
5
- "eval_runtime": 0.7631,
6
- "eval_samples_per_second": 9.173,
7
- "eval_steps_per_second": 1.31,
8
  "total_flos": 4250374116581376.0,
9
  "train_loss": 0.17864632606506348,
10
- "train_runtime": 50.2769,
11
- "train_samples_per_second": 3.401,
12
- "train_steps_per_second": 0.06
13
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.2857142857142857,
4
  "eval_loss": 0.7827825546264648,
5
+ "eval_runtime": 0.7719,
6
+ "eval_samples_per_second": 9.069,
7
+ "eval_steps_per_second": 1.296,
8
  "total_flos": 4250374116581376.0,
9
  "train_loss": 0.17864632606506348,
10
+ "train_runtime": 45.1081,
11
+ "train_samples_per_second": 3.791,
12
+ "train_steps_per_second": 0.067
13
  }
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.2857142857142857,
4
  "eval_loss": 0.7827825546264648,
5
- "eval_runtime": 0.7631,
6
- "eval_samples_per_second": 9.173,
7
- "eval_steps_per_second": 1.31
8
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.2857142857142857,
4
  "eval_loss": 0.7827825546264648,
5
+ "eval_runtime": 0.7719,
6
+ "eval_samples_per_second": 9.069,
7
+ "eval_steps_per_second": 1.296
8
  }
runs/May28_20-29-12_38183ecde2ad/events.out.tfevents.1653769965.38183ecde2ad.92.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0314f2fc5883fd130b79edb3239ac9872e4642746d66e561b0076e0b154a05ce
3
+ size 357
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 3.0,
3
  "total_flos": 4250374116581376.0,
4
  "train_loss": 0.17864632606506348,
5
- "train_runtime": 50.2769,
6
- "train_samples_per_second": 3.401,
7
- "train_steps_per_second": 0.06
8
  }
 
2
  "epoch": 3.0,
3
  "total_flos": 4250374116581376.0,
4
  "train_loss": 0.17864632606506348,
5
+ "train_runtime": 45.1081,
6
+ "train_samples_per_second": 3.791,
7
+ "train_steps_per_second": 0.067
8
  }
trainer_state.json CHANGED
@@ -11,27 +11,27 @@
11
  "epoch": 1.0,
12
  "eval_accuracy": 0.2857142857142857,
13
  "eval_loss": 0.7827825546264648,
14
- "eval_runtime": 0.7129,
15
- "eval_samples_per_second": 9.819,
16
- "eval_steps_per_second": 1.403,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 2.0,
21
  "eval_accuracy": 0.14285714285714285,
22
  "eval_loss": 0.8606036901473999,
23
- "eval_runtime": 0.7151,
24
- "eval_samples_per_second": 9.789,
25
- "eval_steps_per_second": 1.398,
26
  "step": 2
27
  },
28
  {
29
  "epoch": 3.0,
30
  "eval_accuracy": 0.2857142857142857,
31
- "eval_loss": 0.8618679046630859,
32
- "eval_runtime": 0.7739,
33
- "eval_samples_per_second": 9.045,
34
- "eval_steps_per_second": 1.292,
35
  "step": 3
36
  },
37
  {
@@ -39,9 +39,9 @@
39
  "step": 3,
40
  "total_flos": 4250374116581376.0,
41
  "train_loss": 0.17864632606506348,
42
- "train_runtime": 50.2769,
43
- "train_samples_per_second": 3.401,
44
- "train_steps_per_second": 0.06
45
  }
46
  ],
47
  "max_steps": 3,
 
11
  "epoch": 1.0,
12
  "eval_accuracy": 0.2857142857142857,
13
  "eval_loss": 0.7827825546264648,
14
+ "eval_runtime": 0.7023,
15
+ "eval_samples_per_second": 9.967,
16
+ "eval_steps_per_second": 1.424,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 2.0,
21
  "eval_accuracy": 0.14285714285714285,
22
  "eval_loss": 0.8606036901473999,
23
+ "eval_runtime": 0.6969,
24
+ "eval_samples_per_second": 10.044,
25
+ "eval_steps_per_second": 1.435,
26
  "step": 2
27
  },
28
  {
29
  "epoch": 3.0,
30
  "eval_accuracy": 0.2857142857142857,
31
+ "eval_loss": 0.8618678450584412,
32
+ "eval_runtime": 0.7824,
33
+ "eval_samples_per_second": 8.947,
34
+ "eval_steps_per_second": 1.278,
35
  "step": 3
36
  },
37
  {
 
39
  "step": 3,
40
  "total_flos": 4250374116581376.0,
41
  "train_loss": 0.17864632606506348,
42
+ "train_runtime": 45.1081,
43
+ "train_samples_per_second": 3.791,
44
+ "train_steps_per_second": 0.067
45
  }
46
  ],
47
  "max_steps": 3,