gokuls committed on
Commit
8f87fb4
1 Parent(s): 1afce48

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  tags:
3
  - generated_from_trainer
4
  datasets:
@@ -13,7 +15,7 @@ model-index:
13
  name: Text Classification
14
  type: text-classification
15
  dataset:
16
- name: glue
17
  type: glue
18
  config: mrpc
19
  split: validation
@@ -21,10 +23,10 @@ model-index:
21
  metrics:
22
  - name: Accuracy
23
  type: accuracy
24
- value: 0.6838235294117647
25
  - name: F1
26
  type: f1
27
- value: 0.7809847198641766
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,12 +34,12 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  # hBERTv1_mrpc
34
 
35
- This model is a fine-tuned version of [gokuls/bert_12_layer_model_v1](https://huggingface.co/gokuls/bert_12_layer_model_v1) on the glue dataset.
36
  It achieves the following results on the evaluation set:
37
- - Loss: 0.9708
38
- - Accuracy: 0.6838
39
- - F1: 0.7810
40
- - Combined Score: 0.7324
41
 
42
  ## Model description
43
 
 
1
  ---
2
+ language:
3
+ - en
4
  tags:
5
  - generated_from_trainer
6
  datasets:
 
15
  name: Text Classification
16
  type: text-classification
17
  dataset:
18
+ name: GLUE MRPC
19
  type: glue
20
  config: mrpc
21
  split: validation
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.6862745098039216
27
  - name: F1
28
  type: f1
29
+ value: 0.7999999999999999
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # hBERTv1_mrpc
36
 
37
+ This model is a fine-tuned version of [gokuls/bert_12_layer_model_v1](https://huggingface.co/gokuls/bert_12_layer_model_v1) on the GLUE MRPC dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.6051
40
+ - Accuracy: 0.6863
41
+ - F1: 0.8000
42
+ - Combined Score: 0.7431
43
 
44
  ## Model description
45
 
all_results.json CHANGED
@@ -4,13 +4,13 @@
4
  "eval_combined_score": 0.7431372549019608,
5
  "eval_f1": 0.7999999999999999,
6
  "eval_loss": 0.6050820350646973,
7
- "eval_runtime": 0.5403,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 755.096,
10
- "eval_steps_per_second": 3.701,
11
- "train_loss": 0.4964691546228197,
12
- "train_runtime": 203.7797,
13
  "train_samples": 3668,
14
- "train_samples_per_second": 899.991,
15
- "train_steps_per_second": 3.68
16
  }
 
4
  "eval_combined_score": 0.7431372549019608,
5
  "eval_f1": 0.7999999999999999,
6
  "eval_loss": 0.6050820350646973,
7
+ "eval_runtime": 0.5155,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 791.396,
10
+ "eval_steps_per_second": 3.879,
11
+ "train_loss": 0.14563740226957533,
12
+ "train_runtime": 96.9183,
13
  "train_samples": 3668,
14
+ "train_samples_per_second": 1892.315,
15
+ "train_steps_per_second": 7.738
16
  }
eval_results.json CHANGED
@@ -4,8 +4,8 @@
4
  "eval_combined_score": 0.7431372549019608,
5
  "eval_f1": 0.7999999999999999,
6
  "eval_loss": 0.6050820350646973,
7
- "eval_runtime": 0.5403,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 755.096,
10
- "eval_steps_per_second": 3.701
11
  }
 
4
  "eval_combined_score": 0.7431372549019608,
5
  "eval_f1": 0.7999999999999999,
6
  "eval_loss": 0.6050820350646973,
7
+ "eval_runtime": 0.5155,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 791.396,
10
+ "eval_steps_per_second": 3.879
11
  }
logs/events.out.tfevents.1677709281.serv-9225.3038038.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16037de5fbcf6993efcf9449fc4b6614f4c60d4752d2bc547e3b9fa9fbbabad6
3
+ size 467
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 12.0,
3
- "train_loss": 0.4964691546228197,
4
- "train_runtime": 203.7797,
5
  "train_samples": 3668,
6
- "train_samples_per_second": 899.991,
7
- "train_steps_per_second": 3.68
8
  }
 
1
  {
2
  "epoch": 12.0,
3
+ "train_loss": 0.14563740226957533,
4
+ "train_runtime": 96.9183,
5
  "train_samples": 3668,
6
+ "train_samples_per_second": 1892.315,
7
+ "train_steps_per_second": 7.738
8
  }
trainer_state.json CHANGED
@@ -138,9 +138,9 @@
138
  "eval_combined_score": 0.7477645971225257,
139
  "eval_f1": 0.8019017432646594,
140
  "eval_loss": 0.6560007929801941,
141
- "eval_runtime": 0.515,
142
- "eval_samples_per_second": 792.192,
143
- "eval_steps_per_second": 3.883,
144
  "step": 120
145
  },
146
  {
@@ -156,7 +156,7 @@
156
  "eval_f1": 0.7678244972577698,
157
  "eval_loss": 0.6672889590263367,
158
  "eval_runtime": 0.5142,
159
- "eval_samples_per_second": 793.515,
160
  "eval_steps_per_second": 3.89,
161
  "step": 135
162
  },
@@ -172,9 +172,9 @@
172
  "eval_combined_score": 0.7382192221150756,
173
  "eval_f1": 0.7901639344262296,
174
  "eval_loss": 0.8091686367988586,
175
- "eval_runtime": 0.5155,
176
- "eval_samples_per_second": 791.402,
177
- "eval_steps_per_second": 3.879,
178
  "step": 150
179
  },
180
  {
@@ -190,7 +190,7 @@
190
  "eval_f1": 0.7934959349593496,
191
  "eval_loss": 0.9342193603515625,
192
  "eval_runtime": 0.5139,
193
- "eval_samples_per_second": 793.922,
194
  "eval_steps_per_second": 3.892,
195
  "step": 165
196
  },
@@ -206,19 +206,19 @@
206
  "eval_combined_score": 0.7324041246379707,
207
  "eval_f1": 0.7809847198641766,
208
  "eval_loss": 0.9707943201065063,
209
- "eval_runtime": 0.5142,
210
- "eval_samples_per_second": 793.529,
211
- "eval_steps_per_second": 3.89,
212
  "step": 180
213
  },
214
  {
215
  "epoch": 12.0,
216
  "step": 180,
217
  "total_flos": 5559706315653120.0,
218
- "train_loss": 0.4964691546228197,
219
- "train_runtime": 203.7797,
220
- "train_samples_per_second": 899.991,
221
- "train_steps_per_second": 3.68
222
  }
223
  ],
224
  "max_steps": 750,
 
138
  "eval_combined_score": 0.7477645971225257,
139
  "eval_f1": 0.8019017432646594,
140
  "eval_loss": 0.6560007929801941,
141
+ "eval_runtime": 0.5165,
142
+ "eval_samples_per_second": 789.95,
143
+ "eval_steps_per_second": 3.872,
144
  "step": 120
145
  },
146
  {
 
156
  "eval_f1": 0.7678244972577698,
157
  "eval_loss": 0.6672889590263367,
158
  "eval_runtime": 0.5142,
159
+ "eval_samples_per_second": 793.531,
160
  "eval_steps_per_second": 3.89,
161
  "step": 135
162
  },
 
172
  "eval_combined_score": 0.7382192221150756,
173
  "eval_f1": 0.7901639344262296,
174
  "eval_loss": 0.8091686367988586,
175
+ "eval_runtime": 0.5146,
176
+ "eval_samples_per_second": 792.772,
177
+ "eval_steps_per_second": 3.886,
178
  "step": 150
179
  },
180
  {
 
190
  "eval_f1": 0.7934959349593496,
191
  "eval_loss": 0.9342193603515625,
192
  "eval_runtime": 0.5139,
193
+ "eval_samples_per_second": 793.879,
194
  "eval_steps_per_second": 3.892,
195
  "step": 165
196
  },
 
206
  "eval_combined_score": 0.7324041246379707,
207
  "eval_f1": 0.7809847198641766,
208
  "eval_loss": 0.9707943201065063,
209
+ "eval_runtime": 0.5166,
210
+ "eval_samples_per_second": 789.753,
211
+ "eval_steps_per_second": 3.871,
212
  "step": 180
213
  },
214
  {
215
  "epoch": 12.0,
216
  "step": 180,
217
  "total_flos": 5559706315653120.0,
218
+ "train_loss": 0.14563740226957533,
219
+ "train_runtime": 96.9183,
220
+ "train_samples_per_second": 1892.315,
221
+ "train_steps_per_second": 7.738
222
  }
223
  ],
224
  "max_steps": 750,