jorgeortizfuentes
commited on
Commit
·
9cd0ca3
1
Parent(s):
195317b
End of training
Browse files- all_results.json +5 -5
- predict_results_spanish-offensive-language.txt +70 -70
- train_results.json +5 -5
- trainer_state.json +43 -28
all_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 7964,
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second": 2.
|
8 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 3.0,
|
3 |
+
"train_loss": 0.5543336676785267,
|
4 |
+
"train_runtime": 347.758,
|
5 |
"train_samples": 7964,
|
6 |
+
"train_samples_per_second": 68.703,
|
7 |
+
"train_steps_per_second": 2.864
|
8 |
}
|
predict_results_spanish-offensive-language.txt
CHANGED
@@ -1,16 +1,16 @@
|
|
1 |
index prediction
|
2 |
-
0
|
3 |
1 1
|
4 |
2 0
|
5 |
3 1
|
6 |
4 0
|
7 |
5 1
|
8 |
-
6
|
9 |
7 1
|
10 |
8 1
|
11 |
9 1
|
12 |
10 1
|
13 |
-
11
|
14 |
12 1
|
15 |
13 0
|
16 |
14 1
|
@@ -24,10 +24,10 @@ index prediction
|
|
24 |
22 1
|
25 |
23 1
|
26 |
24 0
|
27 |
-
25
|
28 |
26 1
|
29 |
27 1
|
30 |
-
28
|
31 |
29 0
|
32 |
30 0
|
33 |
31 1
|
@@ -60,7 +60,7 @@ index prediction
|
|
60 |
58 1
|
61 |
59 1
|
62 |
60 1
|
63 |
-
61
|
64 |
62 1
|
65 |
63 0
|
66 |
64 1
|
@@ -72,7 +72,7 @@ index prediction
|
|
72 |
70 1
|
73 |
71 1
|
74 |
72 1
|
75 |
-
73
|
76 |
74 0
|
77 |
75 1
|
78 |
76 1
|
@@ -91,7 +91,7 @@ index prediction
|
|
91 |
89 1
|
92 |
90 1
|
93 |
91 1
|
94 |
-
92
|
95 |
93 1
|
96 |
94 1
|
97 |
95 1
|
@@ -120,11 +120,11 @@ index prediction
|
|
120 |
118 1
|
121 |
119 0
|
122 |
120 1
|
123 |
-
121
|
124 |
122 0
|
125 |
123 1
|
126 |
124 1
|
127 |
-
125
|
128 |
126 1
|
129 |
127 1
|
130 |
128 1
|
@@ -159,7 +159,7 @@ index prediction
|
|
159 |
157 1
|
160 |
158 1
|
161 |
159 1
|
162 |
-
160
|
163 |
161 1
|
164 |
162 1
|
165 |
163 1
|
@@ -175,11 +175,11 @@ index prediction
|
|
175 |
173 1
|
176 |
174 1
|
177 |
175 1
|
178 |
-
176
|
179 |
177 0
|
180 |
178 1
|
181 |
-
179
|
182 |
-
180
|
183 |
181 1
|
184 |
182 1
|
185 |
183 1
|
@@ -212,9 +212,9 @@ index prediction
|
|
212 |
210 1
|
213 |
211 1
|
214 |
212 1
|
215 |
-
213
|
216 |
214 1
|
217 |
-
215
|
218 |
216 0
|
219 |
217 0
|
220 |
218 1
|
@@ -227,11 +227,11 @@ index prediction
|
|
227 |
225 1
|
228 |
226 1
|
229 |
227 1
|
230 |
-
228
|
231 |
229 0
|
232 |
230 1
|
233 |
231 1
|
234 |
-
232
|
235 |
233 1
|
236 |
234 0
|
237 |
235 0
|
@@ -251,7 +251,7 @@ index prediction
|
|
251 |
249 1
|
252 |
250 1
|
253 |
251 1
|
254 |
-
252
|
255 |
253 1
|
256 |
254 1
|
257 |
255 0
|
@@ -259,7 +259,7 @@ index prediction
|
|
259 |
257 1
|
260 |
258 1
|
261 |
259 0
|
262 |
-
260
|
263 |
261 1
|
264 |
262 0
|
265 |
263 1
|
@@ -271,7 +271,7 @@ index prediction
|
|
271 |
269 1
|
272 |
270 1
|
273 |
271 1
|
274 |
-
272
|
275 |
273 1
|
276 |
274 1
|
277 |
275 1
|
@@ -297,8 +297,8 @@ index prediction
|
|
297 |
295 0
|
298 |
296 1
|
299 |
297 1
|
300 |
-
298
|
301 |
-
299
|
302 |
300 1
|
303 |
301 1
|
304 |
302 0
|
@@ -314,7 +314,7 @@ index prediction
|
|
314 |
312 1
|
315 |
313 1
|
316 |
314 1
|
317 |
-
315
|
318 |
316 1
|
319 |
317 1
|
320 |
318 1
|
@@ -330,7 +330,7 @@ index prediction
|
|
330 |
328 1
|
331 |
329 0
|
332 |
330 1
|
333 |
-
331
|
334 |
332 1
|
335 |
333 1
|
336 |
334 1
|
@@ -340,7 +340,7 @@ index prediction
|
|
340 |
338 0
|
341 |
339 0
|
342 |
340 1
|
343 |
-
341
|
344 |
342 0
|
345 |
343 0
|
346 |
344 1
|
@@ -358,16 +358,16 @@ index prediction
|
|
358 |
356 0
|
359 |
357 1
|
360 |
358 1
|
361 |
-
359
|
362 |
360 1
|
363 |
361 1
|
364 |
362 1
|
365 |
363 1
|
366 |
364 1
|
367 |
-
365
|
368 |
-
366
|
369 |
367 1
|
370 |
-
368
|
371 |
369 1
|
372 |
370 1
|
373 |
371 1
|
@@ -376,7 +376,7 @@ index prediction
|
|
376 |
374 0
|
377 |
375 1
|
378 |
376 1
|
379 |
-
377
|
380 |
378 1
|
381 |
379 1
|
382 |
380 0
|
@@ -388,7 +388,7 @@ index prediction
|
|
388 |
386 1
|
389 |
387 1
|
390 |
388 1
|
391 |
-
389
|
392 |
390 1
|
393 |
391 0
|
394 |
392 1
|
@@ -396,7 +396,7 @@ index prediction
|
|
396 |
394 1
|
397 |
395 1
|
398 |
396 1
|
399 |
-
397
|
400 |
398 1
|
401 |
399 1
|
402 |
400 1
|
@@ -406,18 +406,18 @@ index prediction
|
|
406 |
404 0
|
407 |
405 1
|
408 |
406 0
|
409 |
-
407
|
410 |
408 1
|
411 |
409 1
|
412 |
410 0
|
413 |
411 0
|
414 |
412 1
|
415 |
413 1
|
416 |
-
414
|
417 |
415 1
|
418 |
416 0
|
419 |
-
417
|
420 |
-
418
|
421 |
419 0
|
422 |
420 1
|
423 |
421 1
|
@@ -427,7 +427,7 @@ index prediction
|
|
427 |
425 1
|
428 |
426 1
|
429 |
427 1
|
430 |
-
428
|
431 |
429 0
|
432 |
430 1
|
433 |
431 1
|
@@ -446,7 +446,7 @@ index prediction
|
|
446 |
444 1
|
447 |
445 0
|
448 |
446 1
|
449 |
-
447
|
450 |
448 1
|
451 |
449 1
|
452 |
450 1
|
@@ -480,14 +480,14 @@ index prediction
|
|
480 |
478 1
|
481 |
479 1
|
482 |
480 0
|
483 |
-
481
|
484 |
482 1
|
485 |
483 1
|
486 |
484 1
|
487 |
485 1
|
488 |
-
486
|
489 |
487 1
|
490 |
-
488
|
491 |
489 1
|
492 |
490 1
|
493 |
491 1
|
@@ -507,13 +507,13 @@ index prediction
|
|
507 |
505 1
|
508 |
506 1
|
509 |
507 1
|
510 |
-
508
|
511 |
509 1
|
512 |
510 1
|
513 |
511 0
|
514 |
512 1
|
515 |
513 1
|
516 |
-
514
|
517 |
515 1
|
518 |
516 1
|
519 |
517 1
|
@@ -541,7 +541,7 @@ index prediction
|
|
541 |
539 1
|
542 |
540 1
|
543 |
541 1
|
544 |
-
542
|
545 |
543 1
|
546 |
544 0
|
547 |
545 0
|
@@ -558,7 +558,7 @@ index prediction
|
|
558 |
556 0
|
559 |
557 1
|
560 |
558 1
|
561 |
-
559
|
562 |
560 1
|
563 |
561 1
|
564 |
562 0
|
@@ -567,22 +567,22 @@ index prediction
|
|
567 |
565 1
|
568 |
566 1
|
569 |
567 1
|
570 |
-
568
|
571 |
569 1
|
572 |
570 0
|
573 |
571 1
|
574 |
572 1
|
575 |
-
573
|
576 |
574 1
|
577 |
575 1
|
578 |
576 1
|
579 |
577 1
|
580 |
578 1
|
581 |
-
579
|
582 |
580 1
|
583 |
581 1
|
584 |
582 0
|
585 |
-
583
|
586 |
584 1
|
587 |
585 1
|
588 |
586 1
|
@@ -611,14 +611,14 @@ index prediction
|
|
611 |
609 1
|
612 |
610 0
|
613 |
611 1
|
614 |
-
612
|
615 |
613 1
|
616 |
614 1
|
617 |
615 1
|
618 |
616 1
|
619 |
617 1
|
620 |
618 1
|
621 |
-
619
|
622 |
620 1
|
623 |
621 1
|
624 |
622 1
|
@@ -633,7 +633,7 @@ index prediction
|
|
633 |
631 1
|
634 |
632 1
|
635 |
633 1
|
636 |
-
634
|
637 |
635 1
|
638 |
636 1
|
639 |
637 1
|
@@ -644,7 +644,7 @@ index prediction
|
|
644 |
642 1
|
645 |
643 1
|
646 |
644 1
|
647 |
-
645
|
648 |
646 1
|
649 |
647 1
|
650 |
648 0
|
@@ -657,12 +657,12 @@ index prediction
|
|
657 |
655 1
|
658 |
656 1
|
659 |
657 1
|
660 |
-
658
|
661 |
-
659
|
662 |
660 1
|
663 |
661 1
|
664 |
662 1
|
665 |
-
663
|
666 |
664 1
|
667 |
665 1
|
668 |
666 1
|
@@ -697,13 +697,13 @@ index prediction
|
|
697 |
695 1
|
698 |
696 1
|
699 |
697 1
|
700 |
-
698
|
701 |
699 1
|
702 |
700 1
|
703 |
701 1
|
704 |
702 1
|
705 |
703 0
|
706 |
-
704
|
707 |
705 1
|
708 |
706 0
|
709 |
707 1
|
@@ -715,7 +715,7 @@ index prediction
|
|
715 |
713 1
|
716 |
714 1
|
717 |
715 1
|
718 |
-
716
|
719 |
717 1
|
720 |
718 1
|
721 |
719 1
|
@@ -754,11 +754,11 @@ index prediction
|
|
754 |
752 1
|
755 |
753 1
|
756 |
754 1
|
757 |
-
755
|
758 |
756 1
|
759 |
757 1
|
760 |
758 1
|
761 |
-
759
|
762 |
760 1
|
763 |
761 1
|
764 |
762 0
|
@@ -772,7 +772,7 @@ index prediction
|
|
772 |
770 0
|
773 |
771 1
|
774 |
772 1
|
775 |
-
773
|
776 |
774 0
|
777 |
775 1
|
778 |
776 0
|
@@ -780,13 +780,13 @@ index prediction
|
|
780 |
778 1
|
781 |
779 1
|
782 |
780 1
|
783 |
-
781
|
784 |
782 1
|
785 |
-
783
|
786 |
784 1
|
787 |
785 1
|
788 |
786 1
|
789 |
-
787
|
790 |
788 1
|
791 |
789 1
|
792 |
790 1
|
@@ -829,9 +829,9 @@ index prediction
|
|
829 |
827 1
|
830 |
828 1
|
831 |
829 1
|
832 |
-
830
|
833 |
831 1
|
834 |
-
832
|
835 |
833 1
|
836 |
834 1
|
837 |
835 1
|
@@ -865,7 +865,7 @@ index prediction
|
|
865 |
863 1
|
866 |
864 1
|
867 |
865 1
|
868 |
-
866
|
869 |
867 0
|
870 |
868 0
|
871 |
869 1
|
@@ -877,7 +877,7 @@ index prediction
|
|
877 |
875 1
|
878 |
876 1
|
879 |
877 1
|
880 |
-
878
|
881 |
879 0
|
882 |
880 0
|
883 |
881 1
|
|
|
1 |
index prediction
|
2 |
+
0 0
|
3 |
1 1
|
4 |
2 0
|
5 |
3 1
|
6 |
4 0
|
7 |
5 1
|
8 |
+
6 0
|
9 |
7 1
|
10 |
8 1
|
11 |
9 1
|
12 |
10 1
|
13 |
+
11 0
|
14 |
12 1
|
15 |
13 0
|
16 |
14 1
|
|
|
24 |
22 1
|
25 |
23 1
|
26 |
24 0
|
27 |
+
25 0
|
28 |
26 1
|
29 |
27 1
|
30 |
+
28 0
|
31 |
29 0
|
32 |
30 0
|
33 |
31 1
|
|
|
60 |
58 1
|
61 |
59 1
|
62 |
60 1
|
63 |
+
61 0
|
64 |
62 1
|
65 |
63 0
|
66 |
64 1
|
|
|
72 |
70 1
|
73 |
71 1
|
74 |
72 1
|
75 |
+
73 0
|
76 |
74 0
|
77 |
75 1
|
78 |
76 1
|
|
|
91 |
89 1
|
92 |
90 1
|
93 |
91 1
|
94 |
+
92 0
|
95 |
93 1
|
96 |
94 1
|
97 |
95 1
|
|
|
120 |
118 1
|
121 |
119 0
|
122 |
120 1
|
123 |
+
121 1
|
124 |
122 0
|
125 |
123 1
|
126 |
124 1
|
127 |
+
125 0
|
128 |
126 1
|
129 |
127 1
|
130 |
128 1
|
|
|
159 |
157 1
|
160 |
158 1
|
161 |
159 1
|
162 |
+
160 1
|
163 |
161 1
|
164 |
162 1
|
165 |
163 1
|
|
|
175 |
173 1
|
176 |
174 1
|
177 |
175 1
|
178 |
+
176 0
|
179 |
177 0
|
180 |
178 1
|
181 |
+
179 1
|
182 |
+
180 0
|
183 |
181 1
|
184 |
182 1
|
185 |
183 1
|
|
|
212 |
210 1
|
213 |
211 1
|
214 |
212 1
|
215 |
+
213 0
|
216 |
214 1
|
217 |
+
215 1
|
218 |
216 0
|
219 |
217 0
|
220 |
218 1
|
|
|
227 |
225 1
|
228 |
226 1
|
229 |
227 1
|
230 |
+
228 0
|
231 |
229 0
|
232 |
230 1
|
233 |
231 1
|
234 |
+
232 0
|
235 |
233 1
|
236 |
234 0
|
237 |
235 0
|
|
|
251 |
249 1
|
252 |
250 1
|
253 |
251 1
|
254 |
+
252 0
|
255 |
253 1
|
256 |
254 1
|
257 |
255 0
|
|
|
259 |
257 1
|
260 |
258 1
|
261 |
259 0
|
262 |
+
260 0
|
263 |
261 1
|
264 |
262 0
|
265 |
263 1
|
|
|
271 |
269 1
|
272 |
270 1
|
273 |
271 1
|
274 |
+
272 0
|
275 |
273 1
|
276 |
274 1
|
277 |
275 1
|
|
|
297 |
295 0
|
298 |
296 1
|
299 |
297 1
|
300 |
+
298 0
|
301 |
+
299 0
|
302 |
300 1
|
303 |
301 1
|
304 |
302 0
|
|
|
314 |
312 1
|
315 |
313 1
|
316 |
314 1
|
317 |
+
315 0
|
318 |
316 1
|
319 |
317 1
|
320 |
318 1
|
|
|
330 |
328 1
|
331 |
329 0
|
332 |
330 1
|
333 |
+
331 0
|
334 |
332 1
|
335 |
333 1
|
336 |
334 1
|
|
|
340 |
338 0
|
341 |
339 0
|
342 |
340 1
|
343 |
+
341 0
|
344 |
342 0
|
345 |
343 0
|
346 |
344 1
|
|
|
358 |
356 0
|
359 |
357 1
|
360 |
358 1
|
361 |
+
359 0
|
362 |
360 1
|
363 |
361 1
|
364 |
362 1
|
365 |
363 1
|
366 |
364 1
|
367 |
+
365 0
|
368 |
+
366 0
|
369 |
367 1
|
370 |
+
368 0
|
371 |
369 1
|
372 |
370 1
|
373 |
371 1
|
|
|
376 |
374 0
|
377 |
375 1
|
378 |
376 1
|
379 |
+
377 0
|
380 |
378 1
|
381 |
379 1
|
382 |
380 0
|
|
|
388 |
386 1
|
389 |
387 1
|
390 |
388 1
|
391 |
+
389 1
|
392 |
390 1
|
393 |
391 0
|
394 |
392 1
|
|
|
396 |
394 1
|
397 |
395 1
|
398 |
396 1
|
399 |
+
397 1
|
400 |
398 1
|
401 |
399 1
|
402 |
400 1
|
|
|
406 |
404 0
|
407 |
405 1
|
408 |
406 0
|
409 |
+
407 0
|
410 |
408 1
|
411 |
409 1
|
412 |
410 0
|
413 |
411 0
|
414 |
412 1
|
415 |
413 1
|
416 |
+
414 0
|
417 |
415 1
|
418 |
416 0
|
419 |
+
417 0
|
420 |
+
418 1
|
421 |
419 0
|
422 |
420 1
|
423 |
421 1
|
|
|
427 |
425 1
|
428 |
426 1
|
429 |
427 1
|
430 |
+
428 0
|
431 |
429 0
|
432 |
430 1
|
433 |
431 1
|
|
|
446 |
444 1
|
447 |
445 0
|
448 |
446 1
|
449 |
+
447 0
|
450 |
448 1
|
451 |
449 1
|
452 |
450 1
|
|
|
480 |
478 1
|
481 |
479 1
|
482 |
480 0
|
483 |
+
481 0
|
484 |
482 1
|
485 |
483 1
|
486 |
484 1
|
487 |
485 1
|
488 |
+
486 0
|
489 |
487 1
|
490 |
+
488 0
|
491 |
489 1
|
492 |
490 1
|
493 |
491 1
|
|
|
507 |
505 1
|
508 |
506 1
|
509 |
507 1
|
510 |
+
508 0
|
511 |
509 1
|
512 |
510 1
|
513 |
511 0
|
514 |
512 1
|
515 |
513 1
|
516 |
+
514 0
|
517 |
515 1
|
518 |
516 1
|
519 |
517 1
|
|
|
541 |
539 1
|
542 |
540 1
|
543 |
541 1
|
544 |
+
542 0
|
545 |
543 1
|
546 |
544 0
|
547 |
545 0
|
|
|
558 |
556 0
|
559 |
557 1
|
560 |
558 1
|
561 |
+
559 0
|
562 |
560 1
|
563 |
561 1
|
564 |
562 0
|
|
|
567 |
565 1
|
568 |
566 1
|
569 |
567 1
|
570 |
+
568 1
|
571 |
569 1
|
572 |
570 0
|
573 |
571 1
|
574 |
572 1
|
575 |
+
573 1
|
576 |
574 1
|
577 |
575 1
|
578 |
576 1
|
579 |
577 1
|
580 |
578 1
|
581 |
+
579 0
|
582 |
580 1
|
583 |
581 1
|
584 |
582 0
|
585 |
+
583 0
|
586 |
584 1
|
587 |
585 1
|
588 |
586 1
|
|
|
611 |
609 1
|
612 |
610 0
|
613 |
611 1
|
614 |
+
612 0
|
615 |
613 1
|
616 |
614 1
|
617 |
615 1
|
618 |
616 1
|
619 |
617 1
|
620 |
618 1
|
621 |
+
619 0
|
622 |
620 1
|
623 |
621 1
|
624 |
622 1
|
|
|
633 |
631 1
|
634 |
632 1
|
635 |
633 1
|
636 |
+
634 0
|
637 |
635 1
|
638 |
636 1
|
639 |
637 1
|
|
|
644 |
642 1
|
645 |
643 1
|
646 |
644 1
|
647 |
+
645 0
|
648 |
646 1
|
649 |
647 1
|
650 |
648 0
|
|
|
657 |
655 1
|
658 |
656 1
|
659 |
657 1
|
660 |
+
658 0
|
661 |
+
659 0
|
662 |
660 1
|
663 |
661 1
|
664 |
662 1
|
665 |
+
663 0
|
666 |
664 1
|
667 |
665 1
|
668 |
666 1
|
|
|
697 |
695 1
|
698 |
696 1
|
699 |
697 1
|
700 |
+
698 0
|
701 |
699 1
|
702 |
700 1
|
703 |
701 1
|
704 |
702 1
|
705 |
703 0
|
706 |
+
704 0
|
707 |
705 1
|
708 |
706 0
|
709 |
707 1
|
|
|
715 |
713 1
|
716 |
714 1
|
717 |
715 1
|
718 |
+
716 0
|
719 |
717 1
|
720 |
718 1
|
721 |
719 1
|
|
|
754 |
752 1
|
755 |
753 1
|
756 |
754 1
|
757 |
+
755 0
|
758 |
756 1
|
759 |
757 1
|
760 |
758 1
|
761 |
+
759 0
|
762 |
760 1
|
763 |
761 1
|
764 |
762 0
|
|
|
772 |
770 0
|
773 |
771 1
|
774 |
772 1
|
775 |
+
773 0
|
776 |
774 0
|
777 |
775 1
|
778 |
776 0
|
|
|
780 |
778 1
|
781 |
779 1
|
782 |
780 1
|
783 |
+
781 1
|
784 |
782 1
|
785 |
+
783 0
|
786 |
784 1
|
787 |
785 1
|
788 |
786 1
|
789 |
+
787 0
|
790 |
788 1
|
791 |
789 1
|
792 |
790 1
|
|
|
829 |
827 1
|
830 |
828 1
|
831 |
829 1
|
832 |
+
830 1
|
833 |
831 1
|
834 |
+
832 0
|
835 |
833 1
|
836 |
834 1
|
837 |
835 1
|
|
|
865 |
863 1
|
866 |
864 1
|
867 |
865 1
|
868 |
+
866 0
|
869 |
867 0
|
870 |
868 0
|
871 |
869 1
|
|
|
877 |
875 1
|
878 |
876 1
|
879 |
877 1
|
880 |
+
878 0
|
881 |
879 0
|
882 |
880 0
|
883 |
881 1
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 7964,
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second": 2.
|
8 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 3.0,
|
3 |
+
"train_loss": 0.5543336676785267,
|
4 |
+
"train_runtime": 347.758,
|
5 |
"train_samples": 7964,
|
6 |
+
"train_samples_per_second": 68.703,
|
7 |
+
"train_steps_per_second": 2.864
|
8 |
}
|
trainer_state.json
CHANGED
@@ -1,55 +1,70 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "models/spanish-offensive-language-bert-base-spanish-wwm-cased/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
9 |
"log_history": [
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
-
"learning_rate":
|
13 |
-
"loss": 0.
|
14 |
"step": 332
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
-
"eval_f1": 0.
|
19 |
-
"eval_loss": 0.
|
20 |
-
"eval_runtime": 5.
|
21 |
-
"eval_samples_per_second":
|
22 |
-
"eval_steps_per_second": 7.
|
23 |
"step": 332
|
24 |
},
|
25 |
{
|
26 |
"epoch": 2.0,
|
27 |
-
"learning_rate":
|
28 |
-
"loss": 0.
|
29 |
"step": 664
|
30 |
},
|
31 |
{
|
32 |
"epoch": 2.0,
|
33 |
-
"eval_f1": 0.
|
34 |
-
"eval_loss": 0.
|
35 |
-
"eval_runtime": 5.
|
36 |
-
"eval_samples_per_second":
|
37 |
-
"eval_steps_per_second": 7.
|
38 |
"step": 664
|
39 |
},
|
40 |
{
|
41 |
-
"epoch":
|
42 |
-
"
|
43 |
-
"
|
44 |
-
"
|
45 |
-
|
46 |
-
|
47 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
}
|
49 |
],
|
50 |
-
"max_steps":
|
51 |
-
"num_train_epochs":
|
52 |
-
"total_flos":
|
53 |
"trial_name": null,
|
54 |
"trial_params": null
|
55 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.6014237329035705,
|
3 |
+
"best_model_checkpoint": "models/spanish-offensive-language-bert-base-spanish-wwm-cased/checkpoint-996",
|
4 |
+
"epoch": 3.0,
|
5 |
+
"global_step": 996,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
9 |
"log_history": [
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
+
"learning_rate": 1.3333333333333333e-05,
|
13 |
+
"loss": 0.6335,
|
14 |
"step": 332
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
+
"eval_f1": 0.5017770187437626,
|
19 |
+
"eval_loss": 0.6012123823165894,
|
20 |
+
"eval_runtime": 5.4247,
|
21 |
+
"eval_samples_per_second": 181.393,
|
22 |
+
"eval_steps_per_second": 7.558,
|
23 |
"step": 332
|
24 |
},
|
25 |
{
|
26 |
"epoch": 2.0,
|
27 |
+
"learning_rate": 6.666666666666667e-06,
|
28 |
+
"loss": 0.5659,
|
29 |
"step": 664
|
30 |
},
|
31 |
{
|
32 |
"epoch": 2.0,
|
33 |
+
"eval_f1": 0.5776452050829993,
|
34 |
+
"eval_loss": 0.5975989103317261,
|
35 |
+
"eval_runtime": 5.271,
|
36 |
+
"eval_samples_per_second": 186.682,
|
37 |
+
"eval_steps_per_second": 7.778,
|
38 |
"step": 664
|
39 |
},
|
40 |
{
|
41 |
+
"epoch": 3.0,
|
42 |
+
"learning_rate": 0.0,
|
43 |
+
"loss": 0.4636,
|
44 |
+
"step": 996
|
45 |
+
},
|
46 |
+
{
|
47 |
+
"epoch": 3.0,
|
48 |
+
"eval_f1": 0.6014237329035705,
|
49 |
+
"eval_loss": 0.6521763801574707,
|
50 |
+
"eval_runtime": 5.4331,
|
51 |
+
"eval_samples_per_second": 181.113,
|
52 |
+
"eval_steps_per_second": 7.546,
|
53 |
+
"step": 996
|
54 |
+
},
|
55 |
+
{
|
56 |
+
"epoch": 3.0,
|
57 |
+
"step": 996,
|
58 |
+
"total_flos": 6286249334661120.0,
|
59 |
+
"train_loss": 0.5543336676785267,
|
60 |
+
"train_runtime": 347.758,
|
61 |
+
"train_samples_per_second": 68.703,
|
62 |
+
"train_steps_per_second": 2.864
|
63 |
}
|
64 |
],
|
65 |
+
"max_steps": 996,
|
66 |
+
"num_train_epochs": 3,
|
67 |
+
"total_flos": 6286249334661120.0,
|
68 |
"trial_name": null,
|
69 |
"trial_params": null
|
70 |
}
|