gokuls committed on
Commit
b03fdeb
·
1 Parent(s): ea5a84b

End of training

Browse files
README.md CHANGED
@@ -1,12 +1,30 @@
1
  ---
 
 
2
  tags:
3
  - generated_from_trainer
 
 
4
  metrics:
5
  - accuracy
6
  - f1
7
  model-index:
8
  - name: hBERTv1_data_aug_mrpc
9
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -14,12 +32,12 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # hBERTv1_data_aug_mrpc
16
 
17
- This model is a fine-tuned version of [gokuls/bert_12_layer_model_v1](https://huggingface.co/gokuls/bert_12_layer_model_v1) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.0164
20
- - Accuracy: 0.9975
21
- - F1: 0.9982
22
- - Combined Score: 0.9979
23
 
24
  ## Model description
25
 
 
1
  ---
2
+ language:
3
+ - en
4
  tags:
5
  - generated_from_trainer
6
+ datasets:
7
+ - glue
8
  metrics:
9
  - accuracy
10
  - f1
11
  model-index:
12
  - name: hBERTv1_data_aug_mrpc
13
+ results:
14
+ - task:
15
+ name: Text Classification
16
+ type: text-classification
17
+ dataset:
18
+ name: GLUE MRPC
19
+ type: glue
20
+ args: mrpc
21
+ metrics:
22
+ - name: Accuracy
23
+ type: accuracy
24
+ value: 1.0
25
+ - name: F1
26
+ type: f1
27
+ value: 1.0
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  # hBERTv1_data_aug_mrpc
34
 
35
+ This model is a fine-tuned version of [gokuls/bert_12_layer_model_v1](https://huggingface.co/gokuls/bert_12_layer_model_v1) on the GLUE MRPC dataset.
36
  It achieves the following results on the evaluation set:
37
+ - Loss: 0.0001
38
+ - Accuracy: 1.0
39
+ - F1: 1.0
40
+ - Combined Score: 1.0
41
 
42
  ## Model description
43
 
all_results.json CHANGED
@@ -4,13 +4,13 @@
4
  "eval_combined_score": 1.0,
5
  "eval_f1": 1.0,
6
  "eval_loss": 5.569791028392501e-05,
7
- "eval_runtime": 0.5673,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 719.251,
10
- "eval_steps_per_second": 3.526,
11
  "train_loss": 0.01846268490869172,
12
- "train_runtime": 9463.9723,
13
  "train_samples": 250736,
14
- "train_samples_per_second": 1324.687,
15
- "train_steps_per_second": 5.178
16
  }
 
4
  "eval_combined_score": 1.0,
5
  "eval_f1": 1.0,
6
  "eval_loss": 5.569791028392501e-05,
7
+ "eval_runtime": 0.5567,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 732.91,
10
+ "eval_steps_per_second": 3.593,
11
  "train_loss": 0.01846268490869172,
12
+ "train_runtime": 9240.4943,
13
  "train_samples": 250736,
14
+ "train_samples_per_second": 1356.724,
15
+ "train_steps_per_second": 5.303
16
  }
eval_results.json CHANGED
@@ -4,8 +4,8 @@
4
  "eval_combined_score": 1.0,
5
  "eval_f1": 1.0,
6
  "eval_loss": 5.569791028392501e-05,
7
- "eval_runtime": 0.5673,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 719.251,
10
- "eval_steps_per_second": 3.526
11
  }
 
4
  "eval_combined_score": 1.0,
5
  "eval_f1": 1.0,
6
  "eval_loss": 5.569791028392501e-05,
7
+ "eval_runtime": 0.5567,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 732.91,
10
+ "eval_steps_per_second": 3.593
11
  }
logs/events.out.tfevents.1677752051.serv-9223.249238.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665afc9f886b5d6cbe7e0983d633e3eea6adb6757cd8bdeed6b7a8e9e3decc24
3
+ size 467
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
  "train_loss": 0.01846268490869172,
4
- "train_runtime": 9463.9723,
5
  "train_samples": 250736,
6
- "train_samples_per_second": 1324.687,
7
- "train_steps_per_second": 5.178
8
  }
 
1
  {
2
  "epoch": 10.0,
3
  "train_loss": 0.01846268490869172,
4
+ "train_runtime": 9240.4943,
5
  "train_samples": 250736,
6
+ "train_samples_per_second": 1356.724,
7
+ "train_steps_per_second": 5.303
8
  }
trainer_state.json CHANGED
@@ -19,9 +19,9 @@
19
  "eval_combined_score": 0.9978800554210951,
20
  "eval_f1": 0.998211091234347,
21
  "eval_loss": 0.004494799301028252,
22
- "eval_runtime": 0.5596,
23
- "eval_samples_per_second": 729.142,
24
- "eval_steps_per_second": 3.574,
25
  "step": 980
26
  },
27
  {
@@ -36,9 +36,9 @@
36
  "eval_combined_score": 1.0,
37
  "eval_f1": 1.0,
38
  "eval_loss": 6.0925009165657684e-05,
39
- "eval_runtime": 0.5584,
40
- "eval_samples_per_second": 730.667,
41
- "eval_steps_per_second": 3.582,
42
  "step": 1960
43
  },
44
  {
@@ -53,9 +53,9 @@
53
  "eval_combined_score": 1.0,
54
  "eval_f1": 1.0,
55
  "eval_loss": 8.451967732980847e-05,
56
- "eval_runtime": 0.5589,
57
- "eval_samples_per_second": 730.056,
58
- "eval_steps_per_second": 3.579,
59
  "step": 2940
60
  },
61
  {
@@ -70,9 +70,9 @@
70
  "eval_combined_score": 1.0,
71
  "eval_f1": 1.0,
72
  "eval_loss": 5.947695899521932e-05,
73
- "eval_runtime": 0.5569,
74
- "eval_samples_per_second": 732.679,
75
- "eval_steps_per_second": 3.592,
76
  "step": 3920
77
  },
78
  {
@@ -87,9 +87,9 @@
87
  "eval_combined_score": 1.0,
88
  "eval_f1": 1.0,
89
  "eval_loss": 5.569791028392501e-05,
90
- "eval_runtime": 0.556,
91
- "eval_samples_per_second": 733.848,
92
- "eval_steps_per_second": 3.597,
93
  "step": 4900
94
  },
95
  {
@@ -104,9 +104,9 @@
104
  "eval_combined_score": 1.0,
105
  "eval_f1": 1.0,
106
  "eval_loss": 0.00023545935982838273,
107
- "eval_runtime": 0.5589,
108
- "eval_samples_per_second": 730.007,
109
- "eval_steps_per_second": 3.578,
110
  "step": 5880
111
  },
112
  {
@@ -121,9 +121,9 @@
121
  "eval_combined_score": 1.0,
122
  "eval_f1": 1.0,
123
  "eval_loss": 0.0002702152996789664,
124
- "eval_runtime": 0.5598,
125
- "eval_samples_per_second": 728.83,
126
- "eval_steps_per_second": 3.573,
127
  "step": 6860
128
  },
129
  {
@@ -138,9 +138,9 @@
138
  "eval_combined_score": 0.997876843735699,
139
  "eval_f1": 0.9982046678635548,
140
  "eval_loss": 0.015019365586340427,
141
- "eval_runtime": 0.558,
142
- "eval_samples_per_second": 731.241,
143
- "eval_steps_per_second": 3.585,
144
  "step": 7840
145
  },
146
  {
@@ -155,9 +155,9 @@
155
  "eval_combined_score": 1.0,
156
  "eval_f1": 1.0,
157
  "eval_loss": 0.0014859754592180252,
158
- "eval_runtime": 0.5575,
159
- "eval_samples_per_second": 731.782,
160
- "eval_steps_per_second": 3.587,
161
  "step": 8820
162
  },
163
  {
@@ -172,9 +172,9 @@
172
  "eval_combined_score": 0.997876843735699,
173
  "eval_f1": 0.9982046678635548,
174
  "eval_loss": 0.016378218308091164,
175
- "eval_runtime": 0.5579,
176
- "eval_samples_per_second": 731.36,
177
- "eval_steps_per_second": 3.585,
178
  "step": 9800
179
  },
180
  {
@@ -182,9 +182,9 @@
182
  "step": 9800,
183
  "total_flos": 3.167072376848384e+17,
184
  "train_loss": 0.01846268490869172,
185
- "train_runtime": 9463.9723,
186
- "train_samples_per_second": 1324.687,
187
- "train_steps_per_second": 5.178
188
  }
189
  ],
190
  "max_steps": 49000,
 
19
  "eval_combined_score": 0.9978800554210951,
20
  "eval_f1": 0.998211091234347,
21
  "eval_loss": 0.004494799301028252,
22
+ "eval_runtime": 0.5297,
23
+ "eval_samples_per_second": 770.282,
24
+ "eval_steps_per_second": 3.776,
25
  "step": 980
26
  },
27
  {
 
36
  "eval_combined_score": 1.0,
37
  "eval_f1": 1.0,
38
  "eval_loss": 6.0925009165657684e-05,
39
+ "eval_runtime": 0.5295,
40
+ "eval_samples_per_second": 770.515,
41
+ "eval_steps_per_second": 3.777,
42
  "step": 1960
43
  },
44
  {
 
53
  "eval_combined_score": 1.0,
54
  "eval_f1": 1.0,
55
  "eval_loss": 8.451967732980847e-05,
56
+ "eval_runtime": 0.5298,
57
+ "eval_samples_per_second": 770.156,
58
+ "eval_steps_per_second": 3.775,
59
  "step": 2940
60
  },
61
  {
 
70
  "eval_combined_score": 1.0,
71
  "eval_f1": 1.0,
72
  "eval_loss": 5.947695899521932e-05,
73
+ "eval_runtime": 0.5287,
74
+ "eval_samples_per_second": 771.7,
75
+ "eval_steps_per_second": 3.783,
76
  "step": 3920
77
  },
78
  {
 
87
  "eval_combined_score": 1.0,
88
  "eval_f1": 1.0,
89
  "eval_loss": 5.569791028392501e-05,
90
+ "eval_runtime": 0.5323,
91
+ "eval_samples_per_second": 766.547,
92
+ "eval_steps_per_second": 3.758,
93
  "step": 4900
94
  },
95
  {
 
104
  "eval_combined_score": 1.0,
105
  "eval_f1": 1.0,
106
  "eval_loss": 0.00023545935982838273,
107
+ "eval_runtime": 0.5293,
108
+ "eval_samples_per_second": 770.865,
109
+ "eval_steps_per_second": 3.779,
110
  "step": 5880
111
  },
112
  {
 
121
  "eval_combined_score": 1.0,
122
  "eval_f1": 1.0,
123
  "eval_loss": 0.0002702152996789664,
124
+ "eval_runtime": 0.5311,
125
+ "eval_samples_per_second": 768.279,
126
+ "eval_steps_per_second": 3.766,
127
  "step": 6860
128
  },
129
  {
 
138
  "eval_combined_score": 0.997876843735699,
139
  "eval_f1": 0.9982046678635548,
140
  "eval_loss": 0.015019365586340427,
141
+ "eval_runtime": 0.5296,
142
+ "eval_samples_per_second": 770.328,
143
+ "eval_steps_per_second": 3.776,
144
  "step": 7840
145
  },
146
  {
 
155
  "eval_combined_score": 1.0,
156
  "eval_f1": 1.0,
157
  "eval_loss": 0.0014859754592180252,
158
+ "eval_runtime": 0.5295,
159
+ "eval_samples_per_second": 770.576,
160
+ "eval_steps_per_second": 3.777,
161
  "step": 8820
162
  },
163
  {
 
172
  "eval_combined_score": 0.997876843735699,
173
  "eval_f1": 0.9982046678635548,
174
  "eval_loss": 0.016378218308091164,
175
+ "eval_runtime": 0.5299,
176
+ "eval_samples_per_second": 770.0,
177
+ "eval_steps_per_second": 3.775,
178
  "step": 9800
179
  },
180
  {
 
182
  "step": 9800,
183
  "total_flos": 3.167072376848384e+17,
184
  "train_loss": 0.01846268490869172,
185
+ "train_runtime": 9240.4943,
186
+ "train_samples_per_second": 1356.724,
187
+ "train_steps_per_second": 5.303
188
  }
189
  ],
190
  "max_steps": 49000,