gokulsrinivasagan committed on
Commit
d6b2520
·
verified ·
1 Parent(s): b11b07e

End of training

Browse files
README.md CHANGED
@@ -1,14 +1,32 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: gokulsrinivasagan/bert_tiny_lda_20
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  - f1
9
  model-index:
10
  - name: bert_tiny_lda_20_mrpc
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,9 +34,9 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # bert_tiny_lda_20_mrpc
18
 
19
- This model is a fine-tuned version of [gokulsrinivasagan/bert_tiny_lda_20](https://huggingface.co/gokulsrinivasagan/bert_tiny_lda_20) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.6279
22
  - Accuracy: 0.6838
23
  - F1: 0.8122
24
  - Combined Score: 0.7480
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: gokulsrinivasagan/bert_tiny_lda_20
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - accuracy
12
  - f1
13
  model-index:
14
  - name: bert_tiny_lda_20_mrpc
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE MRPC
21
+ type: glue
22
+ args: mrpc
23
+ metrics:
24
+ - name: Accuracy
25
+ type: accuracy
26
+ value: 0.6838235294117647
27
+ - name: F1
28
+ type: f1
29
+ value: 0.8122270742358079
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # bert_tiny_lda_20_mrpc
36
 
37
+ This model is a fine-tuned version of [gokulsrinivasagan/bert_tiny_lda_20](https://huggingface.co/gokulsrinivasagan/bert_tiny_lda_20) on the GLUE MRPC dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.6247
40
  - Accuracy: 0.6838
41
  - F1: 0.8122
42
  - Combined Score: 0.7480
all_results.json CHANGED
@@ -3,15 +3,15 @@
3
  "eval_accuracy": 0.6838235294117647,
4
  "eval_combined_score": 0.7480253018237863,
5
  "eval_f1": 0.8122270742358079,
6
- "eval_loss": 0.6239542961120605,
7
- "eval_runtime": 0.3395,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1201.848,
10
- "eval_steps_per_second": 14.729,
11
  "total_flos": 865692760633344.0,
12
- "train_loss": 0.6400821718395265,
13
- "train_runtime": 79.8923,
14
  "train_samples": 3668,
15
- "train_samples_per_second": 1377.354,
16
- "train_steps_per_second": 14.645
17
  }
 
3
  "eval_accuracy": 0.6838235294117647,
4
  "eval_combined_score": 0.7480253018237863,
5
  "eval_f1": 0.8122270742358079,
6
+ "eval_loss": 0.6246840357780457,
7
+ "eval_runtime": 0.1368,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 2982.731,
10
+ "eval_steps_per_second": 14.621,
11
  "total_flos": 865692760633344.0,
12
+ "train_loss": 0.35235131635964767,
13
+ "train_runtime": 15.55,
14
  "train_samples": 3668,
15
+ "train_samples_per_second": 7076.519,
16
+ "train_steps_per_second": 75.241
17
  }
eval_results.json CHANGED
@@ -3,9 +3,9 @@
3
  "eval_accuracy": 0.6838235294117647,
4
  "eval_combined_score": 0.7480253018237863,
5
  "eval_f1": 0.8122270742358079,
6
- "eval_loss": 0.6239542961120605,
7
- "eval_runtime": 0.3395,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1201.848,
10
- "eval_steps_per_second": 14.729
11
  }
 
3
  "eval_accuracy": 0.6838235294117647,
4
  "eval_combined_score": 0.7480253018237863,
5
  "eval_f1": 0.8122270742358079,
6
+ "eval_loss": 0.6246840357780457,
7
+ "eval_runtime": 0.1368,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 2982.731,
10
+ "eval_steps_per_second": 14.621
11
  }
logs/events.out.tfevents.1732251623.ki-g0008.1610732.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b57bc5880eaa4747a794bbab1b4de0de131f24a7757572355f2c9ecd9846a171
3
+ size 515
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 9.0,
3
  "total_flos": 865692760633344.0,
4
- "train_loss": 0.6400821718395265,
5
- "train_runtime": 79.8923,
6
  "train_samples": 3668,
7
- "train_samples_per_second": 1377.354,
8
- "train_steps_per_second": 14.645
9
  }
 
1
  {
2
  "epoch": 9.0,
3
  "total_flos": 865692760633344.0,
4
+ "train_loss": 0.35235131635964767,
5
+ "train_runtime": 15.55,
6
  "train_samples": 3668,
7
+ "train_samples_per_second": 7076.519,
8
+ "train_steps_per_second": 75.241
9
  }
trainer_state.json CHANGED
@@ -82,7 +82,7 @@
82
  },
83
  {
84
  "epoch": 5.0,
85
- "grad_norm": 1.0611114501953125,
86
  "learning_rate": 0.0008333333333333334,
87
  "loss": 0.6361,
88
  "step": 195
@@ -92,15 +92,15 @@
92
  "eval_accuracy": 0.6838235294117647,
93
  "eval_combined_score": 0.7480253018237863,
94
  "eval_f1": 0.8122270742358079,
95
- "eval_loss": 0.6252522468566895,
96
- "eval_runtime": 0.3312,
97
- "eval_samples_per_second": 1231.985,
98
- "eval_steps_per_second": 15.098,
99
  "step": 195
100
  },
101
  {
102
  "epoch": 6.0,
103
- "grad_norm": 2.5196642875671387,
104
  "learning_rate": 0.0008,
105
  "loss": 0.6372,
106
  "step": 234
@@ -110,17 +110,17 @@
110
  "eval_accuracy": 0.6838235294117647,
111
  "eval_combined_score": 0.7480253018237863,
112
  "eval_f1": 0.8122270742358079,
113
- "eval_loss": 0.6242114901542664,
114
- "eval_runtime": 0.3333,
115
- "eval_samples_per_second": 1223.974,
116
- "eval_steps_per_second": 15.0,
117
  "step": 234
118
  },
119
  {
120
  "epoch": 7.0,
121
- "grad_norm": 0.6646435856819153,
122
  "learning_rate": 0.0007666666666666667,
123
- "loss": 0.6325,
124
  "step": 273
125
  },
126
  {
@@ -128,15 +128,15 @@
128
  "eval_accuracy": 0.6838235294117647,
129
  "eval_combined_score": 0.7480253018237863,
130
  "eval_f1": 0.8122270742358079,
131
- "eval_loss": 0.6240382194519043,
132
- "eval_runtime": 0.3326,
133
- "eval_samples_per_second": 1226.748,
134
- "eval_steps_per_second": 15.034,
135
  "step": 273
136
  },
137
  {
138
  "epoch": 8.0,
139
- "grad_norm": 1.2900689840316772,
140
  "learning_rate": 0.0007333333333333333,
141
  "loss": 0.6344,
142
  "step": 312
@@ -146,17 +146,17 @@
146
  "eval_accuracy": 0.6838235294117647,
147
  "eval_combined_score": 0.7480253018237863,
148
  "eval_f1": 0.8122270742358079,
149
- "eval_loss": 0.6250187158584595,
150
- "eval_runtime": 0.3335,
151
- "eval_samples_per_second": 1223.535,
152
- "eval_steps_per_second": 14.994,
153
  "step": 312
154
  },
155
  {
156
  "epoch": 9.0,
157
- "grad_norm": 0.6405686736106873,
158
  "learning_rate": 0.0007,
159
- "loss": 0.6312,
160
  "step": 351
161
  },
162
  {
@@ -164,20 +164,20 @@
164
  "eval_accuracy": 0.6838235294117647,
165
  "eval_combined_score": 0.7480253018237863,
166
  "eval_f1": 0.8122270742358079,
167
- "eval_loss": 0.628382682800293,
168
- "eval_runtime": 0.3309,
169
- "eval_samples_per_second": 1232.846,
170
- "eval_steps_per_second": 15.108,
171
  "step": 351
172
  },
173
  {
174
  "epoch": 9.0,
175
  "step": 351,
176
  "total_flos": 865692760633344.0,
177
- "train_loss": 0.6400821718395265,
178
- "train_runtime": 79.8923,
179
- "train_samples_per_second": 1377.354,
180
- "train_steps_per_second": 14.645
181
  }
182
  ],
183
  "logging_steps": 1,
 
82
  },
83
  {
84
  "epoch": 5.0,
85
+ "grad_norm": 1.0560246706008911,
86
  "learning_rate": 0.0008333333333333334,
87
  "loss": 0.6361,
88
  "step": 195
 
92
  "eval_accuracy": 0.6838235294117647,
93
  "eval_combined_score": 0.7480253018237863,
94
  "eval_f1": 0.8122270742358079,
95
+ "eval_loss": 0.625359058380127,
96
+ "eval_runtime": 0.1374,
97
+ "eval_samples_per_second": 2968.497,
98
+ "eval_steps_per_second": 14.551,
99
  "step": 195
100
  },
101
  {
102
  "epoch": 6.0,
103
+ "grad_norm": 2.507007122039795,
104
  "learning_rate": 0.0008,
105
  "loss": 0.6372,
106
  "step": 234
 
110
  "eval_accuracy": 0.6838235294117647,
111
  "eval_combined_score": 0.7480253018237863,
112
  "eval_f1": 0.8122270742358079,
113
+ "eval_loss": 0.6243536472320557,
114
+ "eval_runtime": 0.1406,
115
+ "eval_samples_per_second": 2901.456,
116
+ "eval_steps_per_second": 14.223,
117
  "step": 234
118
  },
119
  {
120
  "epoch": 7.0,
121
+ "grad_norm": 0.6576654314994812,
122
  "learning_rate": 0.0007666666666666667,
123
+ "loss": 0.6324,
124
  "step": 273
125
  },
126
  {
 
128
  "eval_accuracy": 0.6838235294117647,
129
  "eval_combined_score": 0.7480253018237863,
130
  "eval_f1": 0.8122270742358079,
131
+ "eval_loss": 0.6248611807823181,
132
+ "eval_runtime": 0.1376,
133
+ "eval_samples_per_second": 2965.446,
134
+ "eval_steps_per_second": 14.537,
135
  "step": 273
136
  },
137
  {
138
  "epoch": 8.0,
139
+ "grad_norm": 1.2987427711486816,
140
  "learning_rate": 0.0007333333333333333,
141
  "loss": 0.6344,
142
  "step": 312
 
146
  "eval_accuracy": 0.6838235294117647,
147
  "eval_combined_score": 0.7480253018237863,
148
  "eval_f1": 0.8122270742358079,
149
+ "eval_loss": 0.6241096258163452,
150
+ "eval_runtime": 0.1631,
151
+ "eval_samples_per_second": 2501.529,
152
+ "eval_steps_per_second": 12.262,
153
  "step": 312
154
  },
155
  {
156
  "epoch": 9.0,
157
+ "grad_norm": 0.6472728848457336,
158
  "learning_rate": 0.0007,
159
+ "loss": 0.631,
160
  "step": 351
161
  },
162
  {
 
164
  "eval_accuracy": 0.6838235294117647,
165
  "eval_combined_score": 0.7480253018237863,
166
  "eval_f1": 0.8122270742358079,
167
+ "eval_loss": 0.6279440522193909,
168
+ "eval_runtime": 0.1342,
169
+ "eval_samples_per_second": 3041.182,
170
+ "eval_steps_per_second": 14.908,
171
  "step": 351
172
  },
173
  {
174
  "epoch": 9.0,
175
  "step": 351,
176
  "total_flos": 865692760633344.0,
177
+ "train_loss": 0.35235131635964767,
178
+ "train_runtime": 15.55,
179
+ "train_samples_per_second": 7076.519,
180
+ "train_steps_per_second": 75.241
181
  }
182
  ],
183
  "logging_steps": 1,