File size: 13,141 Bytes
ced1b5d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
{
  "best_metric": 0.8488700693681294,
  "best_model_checkpoint": "result/my-sup-simcse-roberta-large_filtered_final_augx_0517_275578",
  "epoch": 3.0,
  "global_step": 1617,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.05,
      "eval_avg_sts": 0.5474616885388701,
      "eval_sickr_spearman": 0.5431389131459742,
      "eval_stsb_spearman": 0.551784463931766,
      "step": 25
    },
    {
      "epoch": 0.09,
      "eval_avg_sts": 0.8135416256253626,
      "eval_sickr_spearman": 0.7961428840645369,
      "eval_stsb_spearman": 0.8309403671861882,
      "step": 50
    },
    {
      "epoch": 0.14,
      "eval_avg_sts": 0.8290864392720618,
      "eval_sickr_spearman": 0.8119339251910409,
      "eval_stsb_spearman": 0.8462389533530829,
      "step": 75
    },
    {
      "epoch": 0.19,
      "eval_avg_sts": 0.8323075552549601,
      "eval_sickr_spearman": 0.8165074947010796,
      "eval_stsb_spearman": 0.8481076158088408,
      "step": 100
    },
    {
      "epoch": 0.23,
      "eval_avg_sts": 0.8343864858126124,
      "eval_sickr_spearman": 0.8194722624684485,
      "eval_stsb_spearman": 0.8493007091567765,
      "step": 125
    },
    {
      "epoch": 0.28,
      "eval_avg_sts": 0.8378187523831807,
      "eval_sickr_spearman": 0.8246357979974512,
      "eval_stsb_spearman": 0.8510017067689102,
      "step": 150
    },
    {
      "epoch": 0.32,
      "eval_avg_sts": 0.8378495980528481,
      "eval_sickr_spearman": 0.8251682227568927,
      "eval_stsb_spearman": 0.8505309733488035,
      "step": 175
    },
    {
      "epoch": 0.37,
      "eval_avg_sts": 0.8368235864957789,
      "eval_sickr_spearman": 0.8220182470623785,
      "eval_stsb_spearman": 0.8516289259291794,
      "step": 200
    },
    {
      "epoch": 0.42,
      "eval_avg_sts": 0.8395252530386117,
      "eval_sickr_spearman": 0.8250073185670752,
      "eval_stsb_spearman": 0.8540431875101483,
      "step": 225
    },
    {
      "epoch": 0.46,
      "eval_avg_sts": 0.8379672358563708,
      "eval_sickr_spearman": 0.8226389049551619,
      "eval_stsb_spearman": 0.8532955667575798,
      "step": 250
    },
    {
      "epoch": 0.51,
      "eval_avg_sts": 0.8411570915382243,
      "eval_sickr_spearman": 0.827407480737039,
      "eval_stsb_spearman": 0.8549067023394095,
      "step": 275
    },
    {
      "epoch": 0.56,
      "eval_avg_sts": 0.8387757918913767,
      "eval_sickr_spearman": 0.8256738461617319,
      "eval_stsb_spearman": 0.8518777376210215,
      "step": 300
    },
    {
      "epoch": 0.6,
      "eval_avg_sts": 0.841718922029721,
      "eval_sickr_spearman": 0.8281196378780621,
      "eval_stsb_spearman": 0.8553182061813799,
      "step": 325
    },
    {
      "epoch": 0.65,
      "eval_avg_sts": 0.8436536599024109,
      "eval_sickr_spearman": 0.8272171815131412,
      "eval_stsb_spearman": 0.8600901382916806,
      "step": 350
    },
    {
      "epoch": 0.7,
      "eval_avg_sts": 0.8402882236960711,
      "eval_sickr_spearman": 0.8261090079407611,
      "eval_stsb_spearman": 0.854467439451381,
      "step": 375
    },
    {
      "epoch": 0.74,
      "eval_avg_sts": 0.8418557779216453,
      "eval_sickr_spearman": 0.8260196700920862,
      "eval_stsb_spearman": 0.8576918857512046,
      "step": 400
    },
    {
      "epoch": 0.79,
      "eval_avg_sts": 0.844240769517365,
      "eval_sickr_spearman": 0.8310969897940077,
      "eval_stsb_spearman": 0.8573845492407224,
      "step": 425
    },
    {
      "epoch": 0.83,
      "eval_avg_sts": 0.8400099841918098,
      "eval_sickr_spearman": 0.8256829240399036,
      "eval_stsb_spearman": 0.8543370443437162,
      "step": 450
    },
    {
      "epoch": 0.88,
      "eval_avg_sts": 0.8443099698070835,
      "eval_sickr_spearman": 0.8276297686744947,
      "eval_stsb_spearman": 0.8609901709396723,
      "step": 475
    },
    {
      "epoch": 0.93,
      "learning_rate": 6.907854050711195e-06,
      "loss": 0.524,
      "step": 500
    },
    {
      "epoch": 0.93,
      "eval_avg_sts": 0.8402789651908493,
      "eval_sickr_spearman": 0.8248319570157246,
      "eval_stsb_spearman": 0.8557259733659741,
      "step": 500
    },
    {
      "epoch": 0.97,
      "eval_avg_sts": 0.8461724605713624,
      "eval_sickr_spearman": 0.8330373021988031,
      "eval_stsb_spearman": 0.8593076189439217,
      "step": 525
    },
    {
      "epoch": 1.02,
      "eval_avg_sts": 0.8433982001182605,
      "eval_sickr_spearman": 0.8278159852547703,
      "eval_stsb_spearman": 0.8589804149817508,
      "step": 550
    },
    {
      "epoch": 1.07,
      "eval_avg_sts": 0.8449614978763837,
      "eval_sickr_spearman": 0.830460289513344,
      "eval_stsb_spearman": 0.8594627062394233,
      "step": 575
    },
    {
      "epoch": 1.11,
      "eval_avg_sts": 0.8455395546247182,
      "eval_sickr_spearman": 0.8325919578262689,
      "eval_stsb_spearman": 0.8584871514231674,
      "step": 600
    },
    {
      "epoch": 1.16,
      "eval_avg_sts": 0.8446314587494791,
      "eval_sickr_spearman": 0.8281194937847577,
      "eval_stsb_spearman": 0.8611434237142005,
      "step": 625
    },
    {
      "epoch": 1.21,
      "eval_avg_sts": 0.8450148030554683,
      "eval_sickr_spearman": 0.8291058604838908,
      "eval_stsb_spearman": 0.8609237456270458,
      "step": 650
    },
    {
      "epoch": 1.25,
      "eval_avg_sts": 0.8426975130677071,
      "eval_sickr_spearman": 0.8277219883892558,
      "eval_stsb_spearman": 0.8576730377461584,
      "step": 675
    },
    {
      "epoch": 1.3,
      "eval_avg_sts": 0.8422411960347308,
      "eval_sickr_spearman": 0.8265289438606347,
      "eval_stsb_spearman": 0.8579534482088269,
      "step": 700
    },
    {
      "epoch": 1.35,
      "eval_avg_sts": 0.8429589706818645,
      "eval_sickr_spearman": 0.8250001619329609,
      "eval_stsb_spearman": 0.8609177794307681,
      "step": 725
    },
    {
      "epoch": 1.39,
      "eval_avg_sts": 0.8412654164348794,
      "eval_sickr_spearman": 0.8244867094585874,
      "eval_stsb_spearman": 0.8580441234111714,
      "step": 750
    },
    {
      "epoch": 1.44,
      "eval_avg_sts": 0.8460400500676946,
      "eval_sickr_spearman": 0.8282549895219145,
      "eval_stsb_spearman": 0.8638251106134746,
      "step": 775
    },
    {
      "epoch": 1.48,
      "eval_avg_sts": 0.8419603634534258,
      "eval_sickr_spearman": 0.8271723684954995,
      "eval_stsb_spearman": 0.8567483584113522,
      "step": 800
    },
    {
      "epoch": 1.53,
      "eval_avg_sts": 0.8470667141064947,
      "eval_sickr_spearman": 0.8315851779090248,
      "eval_stsb_spearman": 0.8625482503039646,
      "step": 825
    },
    {
      "epoch": 1.58,
      "eval_avg_sts": 0.8445324992544034,
      "eval_sickr_spearman": 0.8299879516618016,
      "eval_stsb_spearman": 0.8590770468470054,
      "step": 850
    },
    {
      "epoch": 1.62,
      "eval_avg_sts": 0.847555914825822,
      "eval_sickr_spearman": 0.8307021261090849,
      "eval_stsb_spearman": 0.8644097035425593,
      "step": 875
    },
    {
      "epoch": 1.67,
      "eval_avg_sts": 0.846777031506697,
      "eval_sickr_spearman": 0.8312180762007332,
      "eval_stsb_spearman": 0.8623359868126609,
      "step": 900
    },
    {
      "epoch": 1.72,
      "eval_avg_sts": 0.8488700693681294,
      "eval_sickr_spearman": 0.8319676976008779,
      "eval_stsb_spearman": 0.8657724411353809,
      "step": 925
    },
    {
      "epoch": 1.76,
      "eval_avg_sts": 0.8447138350851642,
      "eval_sickr_spearman": 0.8262617468433344,
      "eval_stsb_spearman": 0.8631659233269939,
      "step": 950
    },
    {
      "epoch": 1.81,
      "eval_avg_sts": 0.8447763720006275,
      "eval_sickr_spearman": 0.8259132812024007,
      "eval_stsb_spearman": 0.8636394627988543,
      "step": 975
    },
    {
      "epoch": 1.86,
      "learning_rate": 3.815708101422388e-06,
      "loss": 0.2157,
      "step": 1000
    },
    {
      "epoch": 1.86,
      "eval_avg_sts": 0.8460663020851612,
      "eval_sickr_spearman": 0.8274893257338897,
      "eval_stsb_spearman": 0.8646432784364327,
      "step": 1000
    },
    {
      "epoch": 1.9,
      "eval_avg_sts": 0.8426466827719674,
      "eval_sickr_spearman": 0.8228687337755433,
      "eval_stsb_spearman": 0.8624246317683915,
      "step": 1025
    },
    {
      "epoch": 1.95,
      "eval_avg_sts": 0.8469945788874567,
      "eval_sickr_spearman": 0.8279081569384299,
      "eval_stsb_spearman": 0.8660810008364834,
      "step": 1050
    },
    {
      "epoch": 1.99,
      "eval_avg_sts": 0.844677174344695,
      "eval_sickr_spearman": 0.8273461450205025,
      "eval_stsb_spearman": 0.8620082036688875,
      "step": 1075
    },
    {
      "epoch": 2.04,
      "eval_avg_sts": 0.8446326323236237,
      "eval_sickr_spearman": 0.8279530179871731,
      "eval_stsb_spearman": 0.8613122466600744,
      "step": 1100
    },
    {
      "epoch": 2.09,
      "eval_avg_sts": 0.8468692691266899,
      "eval_sickr_spearman": 0.8292202225364149,
      "eval_stsb_spearman": 0.8645183157169649,
      "step": 1125
    },
    {
      "epoch": 2.13,
      "eval_avg_sts": 0.8471682137327401,
      "eval_sickr_spearman": 0.8307442013539448,
      "eval_stsb_spearman": 0.8635922261115354,
      "step": 1150
    },
    {
      "epoch": 2.18,
      "eval_avg_sts": 0.8446425133608689,
      "eval_sickr_spearman": 0.8279184355941376,
      "eval_stsb_spearman": 0.8613665911276003,
      "step": 1175
    },
    {
      "epoch": 2.23,
      "eval_avg_sts": 0.8447830471539575,
      "eval_sickr_spearman": 0.826634035910581,
      "eval_stsb_spearman": 0.8629320583973338,
      "step": 1200
    },
    {
      "epoch": 2.27,
      "eval_avg_sts": 0.8443517239023315,
      "eval_sickr_spearman": 0.8245701875128868,
      "eval_stsb_spearman": 0.8641332602917762,
      "step": 1225
    },
    {
      "epoch": 2.32,
      "eval_avg_sts": 0.8436894469588044,
      "eval_sickr_spearman": 0.8249284034674125,
      "eval_stsb_spearman": 0.8624504904501964,
      "step": 1250
    },
    {
      "epoch": 2.37,
      "eval_avg_sts": 0.8446249300083088,
      "eval_sickr_spearman": 0.8268909542721736,
      "eval_stsb_spearman": 0.862358905744444,
      "step": 1275
    },
    {
      "epoch": 2.41,
      "eval_avg_sts": 0.8460631153640206,
      "eval_sickr_spearman": 0.8276132459755998,
      "eval_stsb_spearman": 0.8645129847524413,
      "step": 1300
    },
    {
      "epoch": 2.46,
      "eval_avg_sts": 0.8450409206315745,
      "eval_sickr_spearman": 0.8269633851731423,
      "eval_stsb_spearman": 0.8631184560900067,
      "step": 1325
    },
    {
      "epoch": 2.5,
      "eval_avg_sts": 0.8444144648283911,
      "eval_sickr_spearman": 0.8256842208796424,
      "eval_stsb_spearman": 0.8631447087771397,
      "step": 1350
    },
    {
      "epoch": 2.55,
      "eval_avg_sts": 0.8441319770667891,
      "eval_sickr_spearman": 0.8250716322119007,
      "eval_stsb_spearman": 0.8631923219216775,
      "step": 1375
    },
    {
      "epoch": 2.6,
      "eval_avg_sts": 0.8440921655811744,
      "eval_sickr_spearman": 0.825079557343638,
      "eval_stsb_spearman": 0.8631047738187106,
      "step": 1400
    },
    {
      "epoch": 2.64,
      "eval_avg_sts": 0.8442932554429321,
      "eval_sickr_spearman": 0.8250880108174912,
      "eval_stsb_spearman": 0.863498500068373,
      "step": 1425
    },
    {
      "epoch": 2.69,
      "eval_avg_sts": 0.8458752869787667,
      "eval_sickr_spearman": 0.8263863875515662,
      "eval_stsb_spearman": 0.865364186405967,
      "step": 1450
    },
    {
      "epoch": 2.74,
      "eval_avg_sts": 0.8455124701644118,
      "eval_sickr_spearman": 0.8256285528330758,
      "eval_stsb_spearman": 0.8653963874957478,
      "step": 1475
    },
    {
      "epoch": 2.78,
      "learning_rate": 7.235621521335808e-07,
      "loss": 0.2017,
      "step": 1500
    },
    {
      "epoch": 2.78,
      "eval_avg_sts": 0.8463352416025529,
      "eval_sickr_spearman": 0.8273291420105935,
      "eval_stsb_spearman": 0.8653413411945124,
      "step": 1500
    },
    {
      "epoch": 2.83,
      "eval_avg_sts": 0.8451320979354053,
      "eval_sickr_spearman": 0.8257100135811147,
      "eval_stsb_spearman": 0.8645541822896958,
      "step": 1525
    },
    {
      "epoch": 2.88,
      "eval_avg_sts": 0.8447004499326362,
      "eval_sickr_spearman": 0.8251015273595114,
      "eval_stsb_spearman": 0.8642993725057609,
      "step": 1550
    },
    {
      "epoch": 2.92,
      "eval_avg_sts": 0.8451416986583431,
      "eval_sickr_spearman": 0.8259361920377868,
      "eval_stsb_spearman": 0.8643472052788993,
      "step": 1575
    },
    {
      "epoch": 2.97,
      "eval_avg_sts": 0.8452566149686973,
      "eval_sickr_spearman": 0.8260989214094591,
      "eval_stsb_spearman": 0.8644143085279357,
      "step": 1600
    },
    {
      "epoch": 3.0,
      "step": 1617,
      "train_runtime": 3774.3125,
      "train_samples_per_second": 0.428
    }
  ],
  "max_steps": 1617,
  "num_train_epochs": 3,
  "total_flos": 388517232930716160,
  "trial_name": null,
  "trial_params": null
}