File size: 78,168 Bytes
2a9ad6d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 |
[01:32:30] INFO - Epoch 1/50, Iter 0: Loss = 1.0565705299377441, lr = 0.0001
[01:33:06] INFO - Epoch 1/50, Iter 100: Loss = 0.052893124520778656, lr = 0.0001
[01:33:43] INFO - Epoch 1/50, Iter 200: Loss = 0.06410080194473267, lr = 0.0001
[01:34:20] INFO - Epoch 1/50, Iter 300: Loss = 0.036012835800647736, lr = 0.0001
[01:34:57] INFO - Epoch 1/50, Iter 400: Loss = 0.04257039353251457, lr = 0.0001
[01:35:35] INFO - Epoch 1/50, Iter 500: Loss = 0.04468406364321709, lr = 0.0001
[01:36:12] INFO - Epoch 1/50, Iter 600: Loss = 0.031456008553504944, lr = 0.0001
[01:36:49] INFO - Epoch 1/50, Iter 700: Loss = 0.03800628334283829, lr = 0.0001
[01:37:26] INFO - Epoch 1/50, Iter 800: Loss = 0.05088917911052704, lr = 0.0001
[01:38:04] INFO - Epoch 1/50, Iter 900: Loss = 0.04832298308610916, lr = 0.0001
[01:39:47] INFO - Epoch 1/50, Iter 1000: Loss = 0.021001430228352547, lr = 0.0001
[01:40:23] INFO - Epoch 1/50, Iter 1100: Loss = 0.027549631893634796, lr = 0.0001
[01:41:01] INFO - Epoch 1/50, Iter 1200: Loss = 0.026023169979453087, lr = 0.0001
[01:41:39] INFO - Epoch 1/50, Iter 1300: Loss = 0.019382692873477936, lr = 0.0001
[01:42:17] INFO - Epoch 1/50, Iter 1400: Loss = 0.018007593229413033, lr = 0.0001
[01:42:54] INFO - Epoch 1/50, Iter 1500: Loss = 0.029549293220043182, lr = 0.0001
[01:43:31] INFO - Epoch 1/50, Iter 1600: Loss = 0.033689916133880615, lr = 0.0001
[01:44:09] INFO - Epoch 1/50, Iter 1700: Loss = 0.027298524975776672, lr = 0.0001
[01:44:46] INFO - Epoch 1/50, Iter 1800: Loss = 0.035250209271907806, lr = 0.0001
[01:45:24] INFO - Epoch 2/50, Iter 1900: Loss = 0.03265728801488876, lr = 0.0001
[01:47:08] INFO - Epoch 2/50, Iter 2000: Loss = 0.017500419169664383, lr = 0.0001
[01:47:43] INFO - Epoch 2/50, Iter 2100: Loss = 0.022061176598072052, lr = 0.0001
[01:48:20] INFO - Epoch 2/50, Iter 2200: Loss = 0.031774356961250305, lr = 0.0001
[01:48:57] INFO - Epoch 2/50, Iter 2300: Loss = 0.027994144707918167, lr = 0.0001
[01:49:34] INFO - Epoch 2/50, Iter 2400: Loss = 0.021347511559724808, lr = 0.0001
[01:50:12] INFO - Epoch 2/50, Iter 2500: Loss = 0.03212534263730049, lr = 0.0001
[01:50:49] INFO - Epoch 2/50, Iter 2600: Loss = 0.03436075150966644, lr = 0.0001
[01:51:26] INFO - Epoch 2/50, Iter 2700: Loss = 0.039760299026966095, lr = 0.0001
[01:52:03] INFO - Epoch 2/50, Iter 2800: Loss = 0.018602240830659866, lr = 0.0001
[01:52:41] INFO - Epoch 2/50, Iter 2900: Loss = 0.017089033499360085, lr = 0.0001
[01:54:27] INFO - Epoch 2/50, Iter 3000: Loss = 0.01724972389638424, lr = 0.0001
[01:55:02] INFO - Epoch 2/50, Iter 3100: Loss = 0.02486235462129116, lr = 0.0001
[01:55:37] INFO - Epoch 2/50, Iter 3200: Loss = 0.022042328491806984, lr = 0.0001
[01:56:15] INFO - Epoch 2/50, Iter 3300: Loss = 0.026623308658599854, lr = 0.0001
[01:56:52] INFO - Epoch 2/50, Iter 3400: Loss = 0.02405683323740959, lr = 0.0001
[01:57:30] INFO - Epoch 2/50, Iter 3500: Loss = 0.018972214311361313, lr = 0.0001
[01:58:07] INFO - Epoch 2/50, Iter 3600: Loss = 0.021761640906333923, lr = 0.0001
[01:58:44] INFO - Epoch 2/50, Iter 3700: Loss = 0.023115914314985275, lr = 0.0001
[01:59:23] INFO - Epoch 3/50, Iter 3800: Loss = 0.022612307220697403, lr = 0.0001
[02:00:01] INFO - Epoch 3/50, Iter 3900: Loss = 0.017524931579828262, lr = 0.0001
[02:01:47] INFO - Epoch 3/50, Iter 4000: Loss = 0.01466086134314537, lr = 0.0001
[02:02:22] INFO - Epoch 3/50, Iter 4100: Loss = 0.031845346093177795, lr = 0.0001
[02:02:57] INFO - Epoch 3/50, Iter 4200: Loss = 0.0237705297768116, lr = 0.0001
[02:03:33] INFO - Epoch 3/50, Iter 4300: Loss = 0.0320965051651001, lr = 0.0001
[02:04:11] INFO - Epoch 3/50, Iter 4400: Loss = 0.023783233016729355, lr = 0.0001
[02:04:48] INFO - Epoch 3/50, Iter 4500: Loss = 0.022754667326807976, lr = 0.0001
[02:05:25] INFO - Epoch 3/50, Iter 4600: Loss = 0.030830159783363342, lr = 0.0001
[02:06:03] INFO - Epoch 3/50, Iter 4700: Loss = 0.025824744254350662, lr = 0.0001
[02:06:40] INFO - Epoch 3/50, Iter 4800: Loss = 0.019503239542245865, lr = 0.0001
[02:07:18] INFO - Epoch 3/50, Iter 4900: Loss = 0.021452341228723526, lr = 0.0001
[02:09:05] INFO - Epoch 3/50, Iter 5000: Loss = 0.026259608566761017, lr = 0.0001
[02:09:42] INFO - Epoch 3/50, Iter 5100: Loss = 0.023281030356884003, lr = 0.0001
[02:10:17] INFO - Epoch 3/50, Iter 5200: Loss = 0.020111314952373505, lr = 0.0001
[02:10:52] INFO - Epoch 3/50, Iter 5300: Loss = 0.019614871591329575, lr = 0.0001
[02:11:29] INFO - Epoch 3/50, Iter 5400: Loss = 0.014699136838316917, lr = 0.0001
[02:12:06] INFO - Epoch 3/50, Iter 5500: Loss = 0.021856755018234253, lr = 0.0001
[02:12:44] INFO - Epoch 3/50, Iter 5600: Loss = 0.023845821619033813, lr = 0.0001
[02:13:22] INFO - Epoch 4/50, Iter 5700: Loss = 0.03385388106107712, lr = 0.0001
[02:14:00] INFO - Epoch 4/50, Iter 5800: Loss = 0.03092341311275959, lr = 0.0001
[02:14:38] INFO - Epoch 4/50, Iter 5900: Loss = 0.02334553748369217, lr = 0.0001
[02:16:24] INFO - Epoch 4/50, Iter 6000: Loss = 0.042254190891981125, lr = 0.0001
[02:17:01] INFO - Epoch 4/50, Iter 6100: Loss = 0.026709988713264465, lr = 0.0001
[02:17:37] INFO - Epoch 4/50, Iter 6200: Loss = 0.026842636987566948, lr = 0.0001
[02:18:12] INFO - Epoch 4/50, Iter 6300: Loss = 0.02040724828839302, lr = 0.0001
[02:18:47] INFO - Epoch 4/50, Iter 6400: Loss = 0.03485984355211258, lr = 0.0001
[02:19:24] INFO - Epoch 4/50, Iter 6500: Loss = 0.01901041902601719, lr = 0.0001
[02:20:02] INFO - Epoch 4/50, Iter 6600: Loss = 0.0252228956669569, lr = 0.0001
[02:20:39] INFO - Epoch 4/50, Iter 6700: Loss = 0.022261066362261772, lr = 0.0001
[02:21:17] INFO - Epoch 4/50, Iter 6800: Loss = 0.024207420647144318, lr = 0.0001
[02:21:54] INFO - Epoch 4/50, Iter 6900: Loss = 0.02730383910238743, lr = 0.0001
[02:23:42] INFO - Epoch 4/50, Iter 7000: Loss = 0.030614979565143585, lr = 0.0001
[02:24:19] INFO - Epoch 4/50, Iter 7100: Loss = 0.009843399748206139, lr = 0.0001
[02:24:56] INFO - Epoch 4/50, Iter 7200: Loss = 0.030504770576953888, lr = 0.0001
[02:25:31] INFO - Epoch 4/50, Iter 7300: Loss = 0.019922511652112007, lr = 0.0001
[02:26:06] INFO - Epoch 4/50, Iter 7400: Loss = 0.017346005886793137, lr = 0.0001
[02:26:43] INFO - Epoch 5/50, Iter 7500: Loss = 0.04261239618062973, lr = 0.0001
[02:27:21] INFO - Epoch 5/50, Iter 7600: Loss = 0.01848176121711731, lr = 0.0001
[02:27:59] INFO - Epoch 5/50, Iter 7700: Loss = 0.02630079910159111, lr = 0.0001
[02:28:38] INFO - Epoch 5/50, Iter 7800: Loss = 0.017152022570371628, lr = 0.0001
[02:29:16] INFO - Epoch 5/50, Iter 7900: Loss = 0.019739195704460144, lr = 0.0001
[02:31:02] INFO - Epoch 5/50, Iter 8000: Loss = 0.035217173397541046, lr = 0.0001
[02:31:38] INFO - Epoch 5/50, Iter 8100: Loss = 0.024997148662805557, lr = 0.0001
[02:32:15] INFO - Epoch 5/50, Iter 8200: Loss = 0.01869952492415905, lr = 0.0001
[02:32:51] INFO - Epoch 5/50, Iter 8300: Loss = 0.022771766409277916, lr = 0.0001
[02:33:26] INFO - Epoch 5/50, Iter 8400: Loss = 0.021768197417259216, lr = 0.0001
[02:34:01] INFO - Epoch 5/50, Iter 8500: Loss = 0.02135184407234192, lr = 0.0001
[02:34:38] INFO - Epoch 5/50, Iter 8600: Loss = 0.025887122377753258, lr = 0.0001
[02:35:16] INFO - Epoch 5/50, Iter 8700: Loss = 0.020226851105690002, lr = 0.0001
[02:35:53] INFO - Epoch 5/50, Iter 8800: Loss = 0.0163625106215477, lr = 0.0001
[02:36:31] INFO - Epoch 5/50, Iter 8900: Loss = 0.033197011798620224, lr = 0.0001
[02:38:18] INFO - Epoch 5/50, Iter 9000: Loss = 0.018169889226555824, lr = 0.0001
[02:38:56] INFO - Epoch 5/50, Iter 9100: Loss = 0.01835501380264759, lr = 0.0001
[02:39:33] INFO - Epoch 5/50, Iter 9200: Loss = 0.018355708569288254, lr = 0.0001
[02:40:11] INFO - Epoch 5/50, Iter 9300: Loss = 0.02957603707909584, lr = 0.0001
[02:40:47] INFO - Epoch 6/50, Iter 9400: Loss = 0.02988416701555252, lr = 0.0001
[02:41:22] INFO - Epoch 6/50, Iter 9500: Loss = 0.029050955548882484, lr = 0.0001
[02:41:59] INFO - Epoch 6/50, Iter 9600: Loss = 0.029915111139416695, lr = 0.0001
[02:42:37] INFO - Epoch 6/50, Iter 9700: Loss = 0.032014522701501846, lr = 0.0001
[02:43:15] INFO - Epoch 6/50, Iter 9800: Loss = 0.02710639499127865, lr = 0.0001
[02:43:53] INFO - Epoch 6/50, Iter 9900: Loss = 0.02623252011835575, lr = 0.0001
[02:45:39] INFO - Epoch 6/50, Iter 10000: Loss = 0.018064428120851517, lr = 0.0001
[02:46:16] INFO - Epoch 6/50, Iter 10100: Loss = 0.017915505915880203, lr = 0.0001
[02:46:52] INFO - Epoch 6/50, Iter 10200: Loss = 0.018055936321616173, lr = 0.0001
[02:47:29] INFO - Epoch 6/50, Iter 10300: Loss = 0.02242400124669075, lr = 0.0001
[02:48:06] INFO - Epoch 6/50, Iter 10400: Loss = 0.016980063170194626, lr = 0.0001
[02:48:41] INFO - Epoch 6/50, Iter 10500: Loss = 0.028786756098270416, lr = 0.0001
[02:49:15] INFO - Epoch 6/50, Iter 10600: Loss = 0.0259169340133667, lr = 0.0001
[02:49:52] INFO - Epoch 6/50, Iter 10700: Loss = 0.02411068230867386, lr = 0.0001
[02:50:30] INFO - Epoch 6/50, Iter 10800: Loss = 0.028709815815091133, lr = 0.0001
[02:51:07] INFO - Epoch 6/50, Iter 10900: Loss = 0.023950304836034775, lr = 0.0001
[02:52:55] INFO - Epoch 6/50, Iter 11000: Loss = 0.01635728031396866, lr = 0.0001
[02:53:32] INFO - Epoch 6/50, Iter 11100: Loss = 0.021019836887717247, lr = 0.0001
[02:54:09] INFO - Epoch 6/50, Iter 11200: Loss = 0.03072471171617508, lr = 0.0001
[02:54:48] INFO - Epoch 7/50, Iter 11300: Loss = 0.017645131796598434, lr = 0.0001
[02:55:26] INFO - Epoch 7/50, Iter 11400: Loss = 0.03241223841905594, lr = 0.0001
[02:56:02] INFO - Epoch 7/50, Iter 11500: Loss = 0.023425636813044548, lr = 0.0001
[02:56:38] INFO - Epoch 7/50, Iter 11600: Loss = 0.028445253148674965, lr = 0.0001
[02:57:14] INFO - Epoch 7/50, Iter 11700: Loss = 0.021178875118494034, lr = 0.0001
[02:57:52] INFO - Epoch 7/50, Iter 11800: Loss = 0.025874968618154526, lr = 0.0001
[02:58:30] INFO - Epoch 7/50, Iter 11900: Loss = 0.02024815045297146, lr = 0.0001
[03:00:16] INFO - Epoch 7/50, Iter 12000: Loss = 0.017120303586125374, lr = 0.0001
[03:00:53] INFO - Epoch 7/50, Iter 12100: Loss = 0.029735827818512917, lr = 0.0001
[03:01:29] INFO - Epoch 7/50, Iter 12200: Loss = 0.035674042999744415, lr = 0.0001
[03:02:06] INFO - Epoch 7/50, Iter 12300: Loss = 0.036703627556562424, lr = 0.0001
[03:02:43] INFO - Epoch 7/50, Iter 12400: Loss = 0.02421719767153263, lr = 0.0001
[03:03:20] INFO - Epoch 7/50, Iter 12500: Loss = 0.018868938088417053, lr = 0.0001
[03:03:55] INFO - Epoch 7/50, Iter 12600: Loss = 0.02622353658080101, lr = 0.0001
[03:04:30] INFO - Epoch 7/50, Iter 12700: Loss = 0.01901184767484665, lr = 0.0001
[03:05:06] INFO - Epoch 7/50, Iter 12800: Loss = 0.020489446818828583, lr = 0.0001
[03:05:44] INFO - Epoch 7/50, Iter 12900: Loss = 0.032885171473026276, lr = 0.0001
[03:07:31] INFO - Epoch 7/50, Iter 13000: Loss = 0.022485921159386635, lr = 0.0001
[03:08:08] INFO - Epoch 7/50, Iter 13100: Loss = 0.01670442707836628, lr = 0.0001
[03:08:47] INFO - Epoch 8/50, Iter 13200: Loss = 0.02743910253047943, lr = 0.0001
[03:09:25] INFO - Epoch 8/50, Iter 13300: Loss = 0.018927330151200294, lr = 0.0001
[03:10:03] INFO - Epoch 8/50, Iter 13400: Loss = 0.02689310908317566, lr = 0.0001
[03:10:41] INFO - Epoch 8/50, Iter 13500: Loss = 0.0141057800501585, lr = 0.0001
[03:11:18] INFO - Epoch 8/50, Iter 13600: Loss = 0.028984226286411285, lr = 0.0001
[03:11:53] INFO - Epoch 8/50, Iter 13700: Loss = 0.029749657958745956, lr = 0.0001
[03:12:29] INFO - Epoch 8/50, Iter 13800: Loss = 0.015233050100505352, lr = 0.0001
[03:13:07] INFO - Epoch 8/50, Iter 13900: Loss = 0.0163307785987854, lr = 0.0001
[03:14:53] INFO - Epoch 8/50, Iter 14000: Loss = 0.02872077375650406, lr = 0.0001
[03:15:30] INFO - Epoch 8/50, Iter 14100: Loss = 0.02807019278407097, lr = 0.0001
[03:16:07] INFO - Epoch 8/50, Iter 14200: Loss = 0.03054160065948963, lr = 0.0001
[03:16:43] INFO - Epoch 8/50, Iter 14300: Loss = 0.02313782460987568, lr = 0.0001
[03:17:20] INFO - Epoch 8/50, Iter 14400: Loss = 0.025084566324949265, lr = 0.0001
[03:17:57] INFO - Epoch 8/50, Iter 14500: Loss = 0.02139408141374588, lr = 0.0001
[03:18:34] INFO - Epoch 8/50, Iter 14600: Loss = 0.021309100091457367, lr = 0.0001
[03:19:10] INFO - Epoch 8/50, Iter 14700: Loss = 0.021668197587132454, lr = 0.0001
[03:19:44] INFO - Epoch 8/50, Iter 14800: Loss = 0.027393829077482224, lr = 0.0001
[03:20:20] INFO - Epoch 8/50, Iter 14900: Loss = 0.021895278245210648, lr = 0.0001
[03:22:08] INFO - Epoch 9/50, Iter 15000: Loss = 0.021187055855989456, lr = 0.0001
[03:22:46] INFO - Epoch 9/50, Iter 15100: Loss = 0.02533610723912716, lr = 0.0001
[03:23:24] INFO - Epoch 9/50, Iter 15200: Loss = 0.013163303956389427, lr = 0.0001
[03:24:02] INFO - Epoch 9/50, Iter 15300: Loss = 0.0278776828199625, lr = 0.0001
[03:24:40] INFO - Epoch 9/50, Iter 15400: Loss = 0.02406580187380314, lr = 0.0001
[03:25:19] INFO - Epoch 9/50, Iter 15500: Loss = 0.03571601212024689, lr = 0.0001
[03:25:57] INFO - Epoch 9/50, Iter 15600: Loss = 0.0257314071059227, lr = 0.0001
[03:26:34] INFO - Epoch 9/50, Iter 15700: Loss = 0.01789958029985428, lr = 0.0001
[03:27:10] INFO - Epoch 9/50, Iter 15800: Loss = 0.022831305861473083, lr = 0.0001
[03:27:44] INFO - Epoch 9/50, Iter 15900: Loss = 0.02363549917936325, lr = 0.0001
[03:29:31] INFO - Epoch 9/50, Iter 16000: Loss = 0.01978084072470665, lr = 0.0001
[03:30:08] INFO - Epoch 9/50, Iter 16100: Loss = 0.022113677114248276, lr = 0.0001
[03:30:44] INFO - Epoch 9/50, Iter 16200: Loss = 0.024963347241282463, lr = 0.0001
[03:31:21] INFO - Epoch 9/50, Iter 16300: Loss = 0.013087751343846321, lr = 0.0001
[03:31:58] INFO - Epoch 9/50, Iter 16400: Loss = 0.020678795874118805, lr = 0.0001
[03:32:35] INFO - Epoch 9/50, Iter 16500: Loss = 0.020716585218906403, lr = 0.0001
[03:33:12] INFO - Epoch 9/50, Iter 16600: Loss = 0.015427518635988235, lr = 0.0001
[03:33:48] INFO - Epoch 9/50, Iter 16700: Loss = 0.021022498607635498, lr = 0.0001
[03:34:25] INFO - Epoch 9/50, Iter 16800: Loss = 0.01959395967423916, lr = 0.0001
[03:35:00] INFO - Epoch 10/50, Iter 16900: Loss = 0.032150253653526306, lr = 0.0001
[03:36:46] INFO - Epoch 10/50, Iter 17000: Loss = 0.01854921132326126, lr = 0.0001
[03:37:23] INFO - Epoch 10/50, Iter 17100: Loss = 0.02160738781094551, lr = 0.0001
[03:38:01] INFO - Epoch 10/50, Iter 17200: Loss = 0.015743758529424667, lr = 0.0001
[03:38:38] INFO - Epoch 10/50, Iter 17300: Loss = 0.026099730283021927, lr = 0.0001
[03:39:15] INFO - Epoch 10/50, Iter 17400: Loss = 0.033034007996320724, lr = 0.0001
[03:39:53] INFO - Epoch 10/50, Iter 17500: Loss = 0.01821458525955677, lr = 0.0001
[03:40:30] INFO - Epoch 10/50, Iter 17600: Loss = 0.022443238645792007, lr = 0.0001
[03:41:07] INFO - Epoch 10/50, Iter 17700: Loss = 0.01728179305791855, lr = 0.0001
[03:41:44] INFO - Epoch 10/50, Iter 17800: Loss = 0.031235814094543457, lr = 0.0001
[03:42:19] INFO - Epoch 10/50, Iter 17900: Loss = 0.034977469593286514, lr = 0.0001
[03:44:03] INFO - Epoch 10/50, Iter 18000: Loss = 0.02534203603863716, lr = 0.0001
[03:44:40] INFO - Epoch 10/50, Iter 18100: Loss = 0.022452227771282196, lr = 0.0001
[03:45:18] INFO - Epoch 10/50, Iter 18200: Loss = 0.017300918698310852, lr = 0.0001
[03:45:55] INFO - Epoch 10/50, Iter 18300: Loss = 0.027169708162546158, lr = 0.0001
[03:46:33] INFO - Epoch 10/50, Iter 18400: Loss = 0.015911249443888664, lr = 0.0001
[03:47:10] INFO - Epoch 10/50, Iter 18500: Loss = 0.01670893095433712, lr = 0.0001
[03:47:48] INFO - Epoch 10/50, Iter 18600: Loss = 0.022836333140730858, lr = 0.0001
[03:48:25] INFO - Epoch 10/50, Iter 18700: Loss = 0.019568461924791336, lr = 0.0001
[03:49:03] INFO - Epoch 11/50, Iter 18800: Loss = 0.020943816751241684, lr = 0.0001
[03:49:41] INFO - Epoch 11/50, Iter 18900: Loss = 0.028032630681991577, lr = 0.0001
[03:51:24] INFO - Epoch 11/50, Iter 19000: Loss = 0.015449410304427147, lr = 0.0001
[03:52:02] INFO - Epoch 11/50, Iter 19100: Loss = 0.028382163494825363, lr = 0.0001
[03:52:39] INFO - Epoch 11/50, Iter 19200: Loss = 0.03230266273021698, lr = 0.0001
[03:53:16] INFO - Epoch 11/50, Iter 19300: Loss = 0.021432269364595413, lr = 0.0001
[03:53:54] INFO - Epoch 11/50, Iter 19400: Loss = 0.021147528663277626, lr = 0.0001
[03:54:31] INFO - Epoch 11/50, Iter 19500: Loss = 0.014547022059559822, lr = 0.0001
[03:55:09] INFO - Epoch 11/50, Iter 19600: Loss = 0.030874505639076233, lr = 0.0001
[03:55:45] INFO - Epoch 11/50, Iter 19700: Loss = 0.020982904359698296, lr = 0.0001
[03:56:22] INFO - Epoch 11/50, Iter 19800: Loss = 0.023455671966075897, lr = 0.0001
[03:56:59] INFO - Epoch 11/50, Iter 19900: Loss = 0.024504322558641434, lr = 0.0001
[03:58:41] INFO - Epoch 11/50, Iter 20000: Loss = 0.018932566046714783, lr = 0.0001
[03:59:18] INFO - Epoch 11/50, Iter 20100: Loss = 0.02632874995470047, lr = 0.0001
[03:59:56] INFO - Epoch 11/50, Iter 20200: Loss = 0.029866697266697884, lr = 0.0001
[04:00:33] INFO - Epoch 11/50, Iter 20300: Loss = 0.031086044386029243, lr = 0.0001
[04:01:10] INFO - Epoch 11/50, Iter 20400: Loss = 0.02815106511116028, lr = 0.0001
[04:01:48] INFO - Epoch 11/50, Iter 20500: Loss = 0.02130046673119068, lr = 0.0001
[04:02:25] INFO - Epoch 11/50, Iter 20600: Loss = 0.023784568533301353, lr = 0.0001
[04:03:04] INFO - Epoch 12/50, Iter 20700: Loss = 0.026831526309251785, lr = 0.0001
[04:03:42] INFO - Epoch 12/50, Iter 20800: Loss = 0.022841420024633408, lr = 0.0001
[04:04:20] INFO - Epoch 12/50, Iter 20900: Loss = 0.017967013642191887, lr = 0.0001
[04:06:03] INFO - Epoch 12/50, Iter 21000: Loss = 0.023366201668977737, lr = 0.0001
[04:06:40] INFO - Epoch 12/50, Iter 21100: Loss = 0.011247624643146992, lr = 0.0001
[04:07:18] INFO - Epoch 12/50, Iter 21200: Loss = 0.017998967319726944, lr = 0.0001
[04:07:55] INFO - Epoch 12/50, Iter 21300: Loss = 0.01666315086185932, lr = 0.0001
[04:08:32] INFO - Epoch 12/50, Iter 21400: Loss = 0.027271557599306107, lr = 0.0001
[04:09:10] INFO - Epoch 12/50, Iter 21500: Loss = 0.04178820922970772, lr = 0.0001
[04:09:47] INFO - Epoch 12/50, Iter 21600: Loss = 0.022403031587600708, lr = 0.0001
[04:10:24] INFO - Epoch 12/50, Iter 21700: Loss = 0.018806155771017075, lr = 0.0001
[04:11:01] INFO - Epoch 12/50, Iter 21800: Loss = 0.02545701339840889, lr = 0.0001
[04:11:37] INFO - Epoch 12/50, Iter 21900: Loss = 0.01953921467065811, lr = 0.0001
[04:13:20] INFO - Epoch 12/50, Iter 22000: Loss = 0.01733117178082466, lr = 0.0001
[04:13:56] INFO - Epoch 12/50, Iter 22100: Loss = 0.025370147079229355, lr = 0.0001
[04:14:33] INFO - Epoch 12/50, Iter 22200: Loss = 0.018694361671805382, lr = 0.0001
[04:15:11] INFO - Epoch 12/50, Iter 22300: Loss = 0.02715042605996132, lr = 0.0001
[04:15:48] INFO - Epoch 12/50, Iter 22400: Loss = 0.025544647127389908, lr = 0.0001
[04:16:26] INFO - Epoch 13/50, Iter 22500: Loss = 0.019888730719685555, lr = 0.0001
[04:17:04] INFO - Epoch 13/50, Iter 22600: Loss = 0.021217184141278267, lr = 0.0001
[04:17:42] INFO - Epoch 13/50, Iter 22700: Loss = 0.022269055247306824, lr = 0.0001
[04:18:20] INFO - Epoch 13/50, Iter 22800: Loss = 0.01928224414587021, lr = 0.0001
[04:18:58] INFO - Epoch 13/50, Iter 22900: Loss = 0.015648994594812393, lr = 0.0001
[04:20:44] INFO - Epoch 13/50, Iter 23000: Loss = 0.017691921442747116, lr = 0.0001
[04:21:19] INFO - Epoch 13/50, Iter 23100: Loss = 0.017905689775943756, lr = 0.0001
[04:21:56] INFO - Epoch 13/50, Iter 23200: Loss = 0.02446005865931511, lr = 0.0001
[04:22:33] INFO - Epoch 13/50, Iter 23300: Loss = 0.012783464044332504, lr = 0.0001
[04:23:11] INFO - Epoch 13/50, Iter 23400: Loss = 0.021168000996112823, lr = 0.0001
[04:23:48] INFO - Epoch 13/50, Iter 23500: Loss = 0.021574562415480614, lr = 0.0001
[04:24:25] INFO - Epoch 13/50, Iter 23600: Loss = 0.014954578131437302, lr = 0.0001
[04:25:02] INFO - Epoch 13/50, Iter 23700: Loss = 0.024804923683404922, lr = 0.0001
[04:25:39] INFO - Epoch 13/50, Iter 23800: Loss = 0.022417966276407242, lr = 0.0001
[04:26:15] INFO - Epoch 13/50, Iter 23900: Loss = 0.024885393679142, lr = 0.0001
[04:28:01] INFO - Epoch 13/50, Iter 24000: Loss = 0.01513182558119297, lr = 0.0001
[04:28:35] INFO - Epoch 13/50, Iter 24100: Loss = 0.03394199162721634, lr = 0.0001
[04:29:10] INFO - Epoch 13/50, Iter 24200: Loss = 0.01728047989308834, lr = 0.0001
[04:29:48] INFO - Epoch 13/50, Iter 24300: Loss = 0.021687734872102737, lr = 0.0001
[04:30:26] INFO - Epoch 14/50, Iter 24400: Loss = 0.021854422986507416, lr = 0.0001
[04:31:04] INFO - Epoch 14/50, Iter 24500: Loss = 0.01786675862967968, lr = 0.0001
[04:31:42] INFO - Epoch 14/50, Iter 24600: Loss = 0.013988310471177101, lr = 0.0001
[04:32:20] INFO - Epoch 14/50, Iter 24700: Loss = 0.027566110715270042, lr = 0.0001
[04:32:58] INFO - Epoch 14/50, Iter 24800: Loss = 0.026513565331697464, lr = 0.0001
[04:33:36] INFO - Epoch 14/50, Iter 24900: Loss = 0.03264237195253372, lr = 0.0001
[04:35:25] INFO - Epoch 14/50, Iter 25000: Loss = 0.01717931032180786, lr = 0.0001
[04:36:00] INFO - Epoch 14/50, Iter 25100: Loss = 0.023670285940170288, lr = 0.0001
[04:36:35] INFO - Epoch 14/50, Iter 25200: Loss = 0.024744831025600433, lr = 0.0001
[04:37:11] INFO - Epoch 14/50, Iter 25300: Loss = 0.024575743824243546, lr = 0.0001
[04:37:49] INFO - Epoch 14/50, Iter 25400: Loss = 0.026712141931056976, lr = 0.0001
[04:38:26] INFO - Epoch 14/50, Iter 25500: Loss = 0.024456407874822617, lr = 0.0001
[04:39:04] INFO - Epoch 14/50, Iter 25600: Loss = 0.02141718566417694, lr = 0.0001
[04:39:40] INFO - Epoch 14/50, Iter 25700: Loss = 0.029445897787809372, lr = 0.0001
[04:40:17] INFO - Epoch 14/50, Iter 25800: Loss = 0.02473919466137886, lr = 0.0001
[04:40:54] INFO - Epoch 14/50, Iter 25900: Loss = 0.0274130180478096, lr = 0.0001
[04:42:39] INFO - Epoch 14/50, Iter 26000: Loss = 0.018764521926641464, lr = 0.0001
[04:43:16] INFO - Epoch 14/50, Iter 26100: Loss = 0.02663726732134819, lr = 0.0001
[04:43:51] INFO - Epoch 14/50, Iter 26200: Loss = 0.024019204080104828, lr = 0.0001
[04:44:27] INFO - Epoch 15/50, Iter 26300: Loss = 0.02434862032532692, lr = 0.0001
[04:45:04] INFO - Epoch 15/50, Iter 26400: Loss = 0.019603703171014786, lr = 0.0001
[04:45:42] INFO - Epoch 15/50, Iter 26500: Loss = 0.02259880304336548, lr = 0.0001
[04:46:20] INFO - Epoch 15/50, Iter 26600: Loss = 0.0331149660050869, lr = 0.0001
[04:46:58] INFO - Epoch 15/50, Iter 26700: Loss = 0.026867881417274475, lr = 0.0001
[04:47:36] INFO - Epoch 15/50, Iter 26800: Loss = 0.024988386780023575, lr = 0.0001
[04:48:14] INFO - Epoch 15/50, Iter 26900: Loss = 0.02191883698105812, lr = 0.0001
[04:50:03] INFO - Epoch 15/50, Iter 27000: Loss = 0.02334633283317089, lr = 0.0001
[04:50:40] INFO - Epoch 15/50, Iter 27100: Loss = 0.037146203219890594, lr = 0.0001
[04:51:16] INFO - Epoch 15/50, Iter 27200: Loss = 0.02440967783331871, lr = 0.0001
[04:51:51] INFO - Epoch 15/50, Iter 27300: Loss = 0.01723914034664631, lr = 0.0001
[04:52:26] INFO - Epoch 15/50, Iter 27400: Loss = 0.018244989216327667, lr = 0.0001
[04:53:04] INFO - Epoch 15/50, Iter 27500: Loss = 0.027221685275435448, lr = 0.0001
[04:53:41] INFO - Epoch 15/50, Iter 27600: Loss = 0.031127087771892548, lr = 0.0001
[04:54:18] INFO - Epoch 15/50, Iter 27700: Loss = 0.030011950060725212, lr = 0.0001
[04:54:54] INFO - Epoch 15/50, Iter 27800: Loss = 0.026527389883995056, lr = 0.0001
[04:55:31] INFO - Epoch 15/50, Iter 27900: Loss = 0.01575150154531002, lr = 0.0001
[04:57:17] INFO - Epoch 15/50, Iter 28000: Loss = 0.021047182381153107, lr = 0.0001
[04:57:54] INFO - Epoch 15/50, Iter 28100: Loss = 0.019234780222177505, lr = 0.0001
[04:58:32] INFO - Epoch 16/50, Iter 28200: Loss = 0.020383525639772415, lr = 0.0001
[04:59:07] INFO - Epoch 16/50, Iter 28300: Loss = 0.016444209963083267, lr = 0.0001
[04:59:43] INFO - Epoch 16/50, Iter 28400: Loss = 0.018604744225740433, lr = 0.0001
[05:00:20] INFO - Epoch 16/50, Iter 28500: Loss = 0.019427413120865822, lr = 0.0001
[05:00:58] INFO - Epoch 16/50, Iter 28600: Loss = 0.017774565145373344, lr = 0.0001
[05:01:36] INFO - Epoch 16/50, Iter 28700: Loss = 0.023675590753555298, lr = 0.0001
[05:02:14] INFO - Epoch 16/50, Iter 28800: Loss = 0.020861458033323288, lr = 0.0001
[05:02:52] INFO - Epoch 16/50, Iter 28900: Loss = 0.018384676426649094, lr = 0.0001
[05:04:40] INFO - Epoch 16/50, Iter 29000: Loss = 0.016222134232521057, lr = 0.0001
[05:05:18] INFO - Epoch 16/50, Iter 29100: Loss = 0.028459617868065834, lr = 0.0001
[05:05:55] INFO - Epoch 16/50, Iter 29200: Loss = 0.01797397807240486, lr = 0.0001
[05:06:32] INFO - Epoch 16/50, Iter 29300: Loss = 0.017931153997778893, lr = 0.0001
[05:07:06] INFO - Epoch 16/50, Iter 29400: Loss = 0.02121908590197563, lr = 0.0001
[05:07:42] INFO - Epoch 16/50, Iter 29500: Loss = 0.013189872726798058, lr = 0.0001
[05:08:19] INFO - Epoch 16/50, Iter 29600: Loss = 0.03299304470419884, lr = 0.0001
[05:08:55] INFO - Epoch 16/50, Iter 29700: Loss = 0.02376321330666542, lr = 0.0001
[05:09:32] INFO - Epoch 16/50, Iter 29800: Loss = 0.019566014409065247, lr = 0.0001
[05:10:09] INFO - Epoch 16/50, Iter 29900: Loss = 0.03177930414676666, lr = 0.0001
[05:11:55] INFO - Epoch 17/50, Iter 30000: Loss = 0.02080521546304226, lr = 0.0001
[05:12:33] INFO - Epoch 17/50, Iter 30100: Loss = 0.015452045015990734, lr = 0.0001
[05:13:10] INFO - Epoch 17/50, Iter 30200: Loss = 0.015891047194600105, lr = 0.0001
[05:13:48] INFO - Epoch 17/50, Iter 30300: Loss = 0.026789262890815735, lr = 0.0001
[05:14:24] INFO - Epoch 17/50, Iter 30400: Loss = 0.019903719425201416, lr = 0.0001
[05:14:59] INFO - Epoch 17/50, Iter 30500: Loss = 0.019173964858055115, lr = 0.0001
[05:15:36] INFO - Epoch 17/50, Iter 30600: Loss = 0.022256750613451004, lr = 0.0001
[05:16:14] INFO - Epoch 17/50, Iter 30700: Loss = 0.02445339225232601, lr = 0.0001
[05:16:52] INFO - Epoch 17/50, Iter 30800: Loss = 0.024548256769776344, lr = 0.0001
[05:17:30] INFO - Epoch 17/50, Iter 30900: Loss = 0.02155543863773346, lr = 0.0001
[05:19:18] INFO - Epoch 17/50, Iter 31000: Loss = 0.021055273711681366, lr = 0.0001
[05:19:56] INFO - Epoch 17/50, Iter 31100: Loss = 0.020960915833711624, lr = 0.0001
[05:20:33] INFO - Epoch 17/50, Iter 31200: Loss = 0.025311872363090515, lr = 0.0001
[05:21:11] INFO - Epoch 17/50, Iter 31300: Loss = 0.019544431939721107, lr = 0.0001
[05:21:48] INFO - Epoch 17/50, Iter 31400: Loss = 0.01915333792567253, lr = 0.0001
[05:22:22] INFO - Epoch 17/50, Iter 31500: Loss = 0.03003186732530594, lr = 0.0001
[05:22:56] INFO - Epoch 17/50, Iter 31600: Loss = 0.02915569767355919, lr = 0.0001
[05:23:33] INFO - Epoch 17/50, Iter 31700: Loss = 0.024165939539670944, lr = 0.0001
[05:24:10] INFO - Epoch 17/50, Iter 31800: Loss = 0.015153701417148113, lr = 0.0001
[05:24:47] INFO - Epoch 18/50, Iter 31900: Loss = 0.015807051211595535, lr = 0.0001
[05:26:34] INFO - Epoch 18/50, Iter 32000: Loss = 0.024118462577462196, lr = 0.0001
[05:27:11] INFO - Epoch 18/50, Iter 32100: Loss = 0.02389802597463131, lr = 0.0001
[05:27:47] INFO - Epoch 18/50, Iter 32200: Loss = 0.012799250893294811, lr = 0.0001
[05:28:24] INFO - Epoch 18/50, Iter 32300: Loss = 0.022414622828364372, lr = 0.0001
[05:29:01] INFO - Epoch 18/50, Iter 32400: Loss = 0.012300081551074982, lr = 0.0001
[05:29:37] INFO - Epoch 18/50, Iter 32500: Loss = 0.022501520812511444, lr = 0.0001
[05:30:12] INFO - Epoch 18/50, Iter 32600: Loss = 0.02582414075732231, lr = 0.0001
[05:30:47] INFO - Epoch 18/50, Iter 32700: Loss = 0.014079990796744823, lr = 0.0001
[05:31:24] INFO - Epoch 18/50, Iter 32800: Loss = 0.019541800022125244, lr = 0.0001
[05:32:02] INFO - Epoch 18/50, Iter 32900: Loss = 0.018132250756025314, lr = 0.0001
[05:33:49] INFO - Epoch 18/50, Iter 33000: Loss = 0.026356974616646767, lr = 0.0001
[05:34:27] INFO - Epoch 18/50, Iter 33100: Loss = 0.022777386009693146, lr = 0.0001
[05:35:04] INFO - Epoch 18/50, Iter 33200: Loss = 0.019965749233961105, lr = 0.0001
[05:35:42] INFO - Epoch 18/50, Iter 33300: Loss = 0.025099262595176697, lr = 0.0001
[05:36:19] INFO - Epoch 18/50, Iter 33400: Loss = 0.023254601284861565, lr = 0.0001
[05:36:55] INFO - Epoch 18/50, Iter 33500: Loss = 0.019896823912858963, lr = 0.0001
[05:37:31] INFO - Epoch 18/50, Iter 33600: Loss = 0.024235250428318977, lr = 0.0001
[05:38:06] INFO - Epoch 18/50, Iter 33700: Loss = 0.02070479653775692, lr = 0.0001
[05:38:43] INFO - Epoch 19/50, Iter 33800: Loss = 0.035438623279333115, lr = 0.0001
[05:39:21] INFO - Epoch 19/50, Iter 33900: Loss = 0.027448982000350952, lr = 0.0001
[05:41:09] INFO - Epoch 19/50, Iter 34000: Loss = 0.018178656697273254, lr = 0.0001
[05:41:46] INFO - Epoch 19/50, Iter 34100: Loss = 0.038496233522892, lr = 0.0001
[05:42:24] INFO - Epoch 19/50, Iter 34200: Loss = 0.030291561037302017, lr = 0.0001
[05:43:01] INFO - Epoch 19/50, Iter 34300: Loss = 0.03536762297153473, lr = 0.0001
[05:43:38] INFO - Epoch 19/50, Iter 34400: Loss = 0.016288427636027336, lr = 0.0001
[05:44:16] INFO - Epoch 19/50, Iter 34500: Loss = 0.022963257506489754, lr = 0.0001
[05:44:53] INFO - Epoch 19/50, Iter 34600: Loss = 0.026906738057732582, lr = 0.0001
[05:45:28] INFO - Epoch 19/50, Iter 34700: Loss = 0.01948506198823452, lr = 0.0001
[05:46:02] INFO - Epoch 19/50, Iter 34800: Loss = 0.016246482729911804, lr = 0.0001
[05:46:40] INFO - Epoch 19/50, Iter 34900: Loss = 0.02436024695634842, lr = 0.0001
[05:48:27] INFO - Epoch 19/50, Iter 35000: Loss = 0.02122604288160801, lr = 0.0001
[05:49:04] INFO - Epoch 19/50, Iter 35100: Loss = 0.028715120628476143, lr = 0.0001
[05:49:42] INFO - Epoch 19/50, Iter 35200: Loss = 0.026141855865716934, lr = 0.0001
[05:50:19] INFO - Epoch 19/50, Iter 35300: Loss = 0.019213732331991196, lr = 0.0001
[05:50:56] INFO - Epoch 19/50, Iter 35400: Loss = 0.03243093192577362, lr = 0.0001
[05:51:33] INFO - Epoch 19/50, Iter 35500: Loss = 0.03266039490699768, lr = 0.0001
[05:52:09] INFO - Epoch 19/50, Iter 35600: Loss = 0.017232870683073997, lr = 0.0001
[05:52:46] INFO - Epoch 20/50, Iter 35700: Loss = 0.026399090886116028, lr = 0.0001
[05:53:22] INFO - Epoch 20/50, Iter 35800: Loss = 0.028520701453089714, lr = 0.0001
[05:53:58] INFO - Epoch 20/50, Iter 35900: Loss = 0.02605503797531128, lr = 0.0001
[05:55:46] INFO - Epoch 20/50, Iter 36000: Loss = 0.015452174469828606, lr = 0.0001
[05:56:23] INFO - Epoch 20/50, Iter 36100: Loss = 0.017282821238040924, lr = 0.0001
[05:57:01] INFO - Epoch 20/50, Iter 36200: Loss = 0.025303389877080917, lr = 0.0001
[05:57:38] INFO - Epoch 20/50, Iter 36300: Loss = 0.019291004166007042, lr = 0.0001
[05:58:15] INFO - Epoch 20/50, Iter 36400: Loss = 0.02849787101149559, lr = 0.0001
[05:58:53] INFO - Epoch 20/50, Iter 36500: Loss = 0.03238069638609886, lr = 0.0001
[05:59:30] INFO - Epoch 20/50, Iter 36600: Loss = 0.02071816474199295, lr = 0.0001
[06:00:07] INFO - Epoch 20/50, Iter 36700: Loss = 0.019271377474069595, lr = 0.0001
[06:00:42] INFO - Epoch 20/50, Iter 36800: Loss = 0.02762100100517273, lr = 0.0001
[06:01:17] INFO - Epoch 20/50, Iter 36900: Loss = 0.02517077326774597, lr = 0.0001
[06:03:04] INFO - Epoch 20/50, Iter 37000: Loss = 0.03359407186508179, lr = 0.0001
[06:03:42] INFO - Epoch 20/50, Iter 37100: Loss = 0.024368373677134514, lr = 0.0001
[06:04:19] INFO - Epoch 20/50, Iter 37200: Loss = 0.01826002635061741, lr = 0.0001
[06:04:57] INFO - Epoch 20/50, Iter 37300: Loss = 0.018539167940616608, lr = 0.0001
[06:05:33] INFO - Epoch 20/50, Iter 37400: Loss = 0.02147294208407402, lr = 0.0001
[06:06:11] INFO - Epoch 21/50, Iter 37500: Loss = 0.03047824651002884, lr = 0.0001
[06:06:48] INFO - Epoch 21/50, Iter 37600: Loss = 0.02184651419520378, lr = 0.0001
[06:07:26] INFO - Epoch 21/50, Iter 37700: Loss = 0.025026265531778336, lr = 0.0001
[06:08:02] INFO - Epoch 21/50, Iter 37800: Loss = 0.017012089490890503, lr = 0.0001
[06:08:38] INFO - Epoch 21/50, Iter 37900: Loss = 0.026773590594530106, lr = 0.0001
[06:10:24] INFO - Epoch 21/50, Iter 38000: Loss = 0.024802416563034058, lr = 0.0001
[06:11:01] INFO - Epoch 21/50, Iter 38100: Loss = 0.023794755339622498, lr = 0.0001
[06:11:39] INFO - Epoch 21/50, Iter 38200: Loss = 0.019931890070438385, lr = 0.0001
[06:12:16] INFO - Epoch 21/50, Iter 38300: Loss = 0.022862359881401062, lr = 0.0001
[06:12:53] INFO - Epoch 21/50, Iter 38400: Loss = 0.015643121674656868, lr = 0.0001
[06:13:31] INFO - Epoch 21/50, Iter 38500: Loss = 0.018159756436944008, lr = 0.0001
[06:14:08] INFO - Epoch 21/50, Iter 38600: Loss = 0.023093489930033684, lr = 0.0001
[06:14:45] INFO - Epoch 21/50, Iter 38700: Loss = 0.02346295490860939, lr = 0.0001
[06:15:23] INFO - Epoch 21/50, Iter 38800: Loss = 0.016494235023856163, lr = 0.0001
[06:15:58] INFO - Epoch 21/50, Iter 38900: Loss = 0.022135134786367416, lr = 0.0001
[06:17:42] INFO - Epoch 21/50, Iter 39000: Loss = 0.02312326431274414, lr = 0.0001
[06:18:19] INFO - Epoch 21/50, Iter 39100: Loss = 0.01600954681634903, lr = 0.0001
[06:18:57] INFO - Epoch 21/50, Iter 39200: Loss = 0.028728237375617027, lr = 0.0001
[06:19:34] INFO - Epoch 21/50, Iter 39300: Loss = 0.021084200590848923, lr = 0.0001
[06:20:11] INFO - Epoch 22/50, Iter 39400: Loss = 0.027077186852693558, lr = 0.0001
[06:20:49] INFO - Epoch 22/50, Iter 39500: Loss = 0.01724139414727688, lr = 0.0001
[06:21:26] INFO - Epoch 22/50, Iter 39600: Loss = 0.017984826117753983, lr = 0.0001
[06:22:03] INFO - Epoch 22/50, Iter 39700: Loss = 0.020777074620127678, lr = 0.0001
[06:22:41] INFO - Epoch 22/50, Iter 39800: Loss = 0.034250833094120026, lr = 0.0001
[06:23:18] INFO - Epoch 22/50, Iter 39900: Loss = 0.021932916715741158, lr = 0.0001
[06:25:00] INFO - Epoch 22/50, Iter 40000: Loss = 0.03071112185716629, lr = 0.0001
[06:25:38] INFO - Epoch 22/50, Iter 40100: Loss = 0.021631088107824326, lr = 0.0001
[06:26:15] INFO - Epoch 22/50, Iter 40200: Loss = 0.018738504499197006, lr = 0.0001
[06:26:53] INFO - Epoch 22/50, Iter 40300: Loss = 0.028383584693074226, lr = 0.0001
[06:27:30] INFO - Epoch 22/50, Iter 40400: Loss = 0.021290233358740807, lr = 0.0001
[06:28:07] INFO - Epoch 22/50, Iter 40500: Loss = 0.03446844965219498, lr = 0.0001
[06:28:45] INFO - Epoch 22/50, Iter 40600: Loss = 0.018756400793790817, lr = 0.0001
[06:29:22] INFO - Epoch 22/50, Iter 40700: Loss = 0.024726085364818573, lr = 0.0001
[06:30:00] INFO - Epoch 22/50, Iter 40800: Loss = 0.015223012305796146, lr = 0.0001
[06:30:37] INFO - Epoch 22/50, Iter 40900: Loss = 0.023908548057079315, lr = 0.0001
[06:32:19] INFO - Epoch 22/50, Iter 41000: Loss = 0.029199382290244102, lr = 0.0001
[06:32:56] INFO - Epoch 22/50, Iter 41100: Loss = 0.028144368901848793, lr = 0.0001
[06:33:34] INFO - Epoch 22/50, Iter 41200: Loss = 0.02745593711733818, lr = 0.0001
[06:34:12] INFO - Epoch 23/50, Iter 41300: Loss = 0.019279180094599724, lr = 0.0001
[06:34:49] INFO - Epoch 23/50, Iter 41400: Loss = 0.02318675071001053, lr = 0.0001
[06:35:26] INFO - Epoch 23/50, Iter 41500: Loss = 0.017886362969875336, lr = 0.0001
[06:36:03] INFO - Epoch 23/50, Iter 41600: Loss = 0.018750198185443878, lr = 0.0001
[06:36:41] INFO - Epoch 23/50, Iter 41700: Loss = 0.02191336825489998, lr = 0.0001
[06:37:18] INFO - Epoch 23/50, Iter 41800: Loss = 0.03157617896795273, lr = 0.0001
[06:37:55] INFO - Epoch 23/50, Iter 41900: Loss = 0.017570078372955322, lr = 0.0001
[06:39:38] INFO - Epoch 23/50, Iter 42000: Loss = 0.02058098092675209, lr = 0.0001
[06:40:15] INFO - Epoch 23/50, Iter 42100: Loss = 0.026018939912319183, lr = 0.0001
[06:40:52] INFO - Epoch 23/50, Iter 42200: Loss = 0.02059439942240715, lr = 0.0001
[06:41:30] INFO - Epoch 23/50, Iter 42300: Loss = 0.011693568900227547, lr = 0.0001
[06:42:07] INFO - Epoch 23/50, Iter 42400: Loss = 0.022519651800394058, lr = 0.0001
[06:42:44] INFO - Epoch 23/50, Iter 42500: Loss = 0.01847762055695057, lr = 0.0001
[06:43:22] INFO - Epoch 23/50, Iter 42600: Loss = 0.020165227353572845, lr = 0.0001
[06:43:59] INFO - Epoch 23/50, Iter 42700: Loss = 0.027182873338460922, lr = 0.0001
[06:44:36] INFO - Epoch 23/50, Iter 42800: Loss = 0.018888037651777267, lr = 0.0001
[06:45:14] INFO - Epoch 23/50, Iter 42900: Loss = 0.00990472175180912, lr = 0.0001
[06:46:58] INFO - Epoch 23/50, Iter 43000: Loss = 0.009258471429347992, lr = 0.0001
[06:47:33] INFO - Epoch 23/50, Iter 43100: Loss = 0.017583448439836502, lr = 0.0001
[06:48:12] INFO - Epoch 24/50, Iter 43200: Loss = 0.027309181168675423, lr = 0.0001
[06:48:50] INFO - Epoch 24/50, Iter 43300: Loss = 0.022596612572669983, lr = 0.0001
[06:49:27] INFO - Epoch 24/50, Iter 43400: Loss = 0.016877392306923866, lr = 0.0001
[06:50:04] INFO - Epoch 24/50, Iter 43500: Loss = 0.02063451148569584, lr = 0.0001
[06:50:42] INFO - Epoch 24/50, Iter 43600: Loss = 0.023637618869543076, lr = 0.0001
[06:51:19] INFO - Epoch 24/50, Iter 43700: Loss = 0.022452209144830704, lr = 0.0001
[06:51:56] INFO - Epoch 24/50, Iter 43800: Loss = 0.019610881805419922, lr = 0.0001
[06:52:34] INFO - Epoch 24/50, Iter 43900: Loss = 0.02145165205001831, lr = 0.0001
[06:54:18] INFO - Epoch 24/50, Iter 44000: Loss = 0.021221479400992393, lr = 0.0001
[06:54:53] INFO - Epoch 24/50, Iter 44100: Loss = 0.018081754446029663, lr = 0.0001
[06:55:30] INFO - Epoch 24/50, Iter 44200: Loss = 0.019172552973031998, lr = 0.0001
[06:56:07] INFO - Epoch 24/50, Iter 44300: Loss = 0.029354147613048553, lr = 0.0001
[06:56:45] INFO - Epoch 24/50, Iter 44400: Loss = 0.02133547142148018, lr = 0.0001
[06:57:22] INFO - Epoch 24/50, Iter 44500: Loss = 0.03115892969071865, lr = 0.0001
[06:57:59] INFO - Epoch 24/50, Iter 44600: Loss = 0.028472255915403366, lr = 0.0001
[06:58:37] INFO - Epoch 24/50, Iter 44700: Loss = 0.01984764076769352, lr = 0.0001
[06:59:14] INFO - Epoch 24/50, Iter 44800: Loss = 0.020234258845448494, lr = 0.0001
[06:59:51] INFO - Epoch 24/50, Iter 44900: Loss = 0.013643868267536163, lr = 0.0001
[07:01:38] INFO - Epoch 25/50, Iter 45000: Loss = 0.020893389359116554, lr = 0.0001
[07:02:14] INFO - Epoch 25/50, Iter 45100: Loss = 0.018400561064481735, lr = 0.0001
[07:02:49] INFO - Epoch 25/50, Iter 45200: Loss = 0.024892032146453857, lr = 0.0001
[07:03:28] INFO - Epoch 25/50, Iter 45300: Loss = 0.02168758027255535, lr = 0.0001
[07:04:04] INFO - Epoch 25/50, Iter 45400: Loss = 0.014965218491852283, lr = 0.0001
[07:04:42] INFO - Epoch 25/50, Iter 45500: Loss = 0.016451682895421982, lr = 0.0001
[07:05:19] INFO - Epoch 25/50, Iter 45600: Loss = 0.01958932727575302, lr = 0.0001
[07:05:57] INFO - Epoch 25/50, Iter 45700: Loss = 0.02093309909105301, lr = 0.0001
[07:06:34] INFO - Epoch 25/50, Iter 45800: Loss = 0.019978303462266922, lr = 0.0001
[07:07:11] INFO - Epoch 25/50, Iter 45900: Loss = 0.026181869208812714, lr = 0.0001
[07:08:57] INFO - Epoch 25/50, Iter 46000: Loss = 0.01811271533370018, lr = 0.0001
[07:09:33] INFO - Epoch 25/50, Iter 46100: Loss = 0.01941503770649433, lr = 0.0001
[07:10:08] INFO - Epoch 25/50, Iter 46200: Loss = 0.02309822291135788, lr = 0.0001
[07:10:43] INFO - Epoch 25/50, Iter 46300: Loss = 0.019712526351213455, lr = 0.0001
[07:11:21] INFO - Epoch 25/50, Iter 46400: Loss = 0.02885950542986393, lr = 0.0001
[07:11:58] INFO - Epoch 25/50, Iter 46500: Loss = 0.022054243832826614, lr = 0.0001
[07:12:36] INFO - Epoch 25/50, Iter 46600: Loss = 0.020716888830065727, lr = 0.0001
[07:13:13] INFO - Epoch 25/50, Iter 46700: Loss = 0.029608381912112236, lr = 0.0001
[07:13:50] INFO - Epoch 25/50, Iter 46800: Loss = 0.031893111765384674, lr = 0.0001
[07:14:29] INFO - Epoch 26/50, Iter 46900: Loss = 0.018023375421762466, lr = 0.0001
[07:16:17] INFO - Epoch 26/50, Iter 47000: Loss = 0.021756181493401527, lr = 0.0001
[07:16:54] INFO - Epoch 26/50, Iter 47100: Loss = 0.014003759250044823, lr = 0.0001
[07:17:28] INFO - Epoch 26/50, Iter 47200: Loss = 0.02504022791981697, lr = 0.0001
[07:18:03] INFO - Epoch 26/50, Iter 47300: Loss = 0.022718233987689018, lr = 0.0001
[07:18:39] INFO - Epoch 26/50, Iter 47400: Loss = 0.022739659994840622, lr = 0.0001
[07:19:16] INFO - Epoch 26/50, Iter 47500: Loss = 0.01982242986559868, lr = 0.0001
[07:19:53] INFO - Epoch 26/50, Iter 47600: Loss = 0.023511618375778198, lr = 0.0001
[07:20:30] INFO - Epoch 26/50, Iter 47700: Loss = 0.02158450335264206, lr = 0.0001
[07:21:06] INFO - Epoch 26/50, Iter 47800: Loss = 0.0194215290248394, lr = 0.0001
[07:21:43] INFO - Epoch 26/50, Iter 47900: Loss = 0.01607697084546089, lr = 0.0001
[07:23:29] INFO - Epoch 26/50, Iter 48000: Loss = 0.031847916543483734, lr = 0.0001
[07:24:06] INFO - Epoch 26/50, Iter 48100: Loss = 0.016561947762966156, lr = 0.0001
[07:24:42] INFO - Epoch 26/50, Iter 48200: Loss = 0.022396143525838852, lr = 0.0001
[07:25:17] INFO - Epoch 26/50, Iter 48300: Loss = 0.014768151566386223, lr = 0.0001
[07:25:52] INFO - Epoch 26/50, Iter 48400: Loss = 0.017738102003932, lr = 0.0001
[07:26:29] INFO - Epoch 26/50, Iter 48500: Loss = 0.02863166481256485, lr = 0.0001
[07:27:06] INFO - Epoch 26/50, Iter 48600: Loss = 0.020090758800506592, lr = 0.0001
[07:27:43] INFO - Epoch 26/50, Iter 48700: Loss = 0.025523288175463676, lr = 0.0001
[07:28:22] INFO - Epoch 27/50, Iter 48800: Loss = 0.015607817098498344, lr = 0.0001
[07:29:00] INFO - Epoch 27/50, Iter 48900: Loss = 0.01831909641623497, lr = 0.0001
[07:30:48] INFO - Epoch 27/50, Iter 49000: Loss = 0.020194053649902344, lr = 0.0001
[07:31:25] INFO - Epoch 27/50, Iter 49100: Loss = 0.016583867371082306, lr = 0.0001
[07:32:01] INFO - Epoch 27/50, Iter 49200: Loss = 0.025016678497195244, lr = 0.0001
[07:32:37] INFO - Epoch 27/50, Iter 49300: Loss = 0.019450880587100983, lr = 0.0001
[07:33:12] INFO - Epoch 27/50, Iter 49400: Loss = 0.019358769059181213, lr = 0.0001
[07:33:47] INFO - Epoch 27/50, Iter 49500: Loss = 0.02399422787129879, lr = 0.0001
[07:34:25] INFO - Epoch 27/50, Iter 49600: Loss = 0.022624319419264793, lr = 0.0001
[07:35:02] INFO - Epoch 27/50, Iter 49700: Loss = 0.018581345677375793, lr = 0.0001
[07:35:40] INFO - Epoch 27/50, Iter 49800: Loss = 0.03396957740187645, lr = 0.0001
[07:36:17] INFO - Epoch 27/50, Iter 49900: Loss = 0.01653345674276352, lr = 0.0001
[07:38:04] INFO - Epoch 27/50, Iter 50000: Loss = 0.020367326214909554, lr = 0.0001
[07:38:42] INFO - Epoch 27/50, Iter 50100: Loss = 0.026802118867635727, lr = 0.0001
[07:39:19] INFO - Epoch 27/50, Iter 50200: Loss = 0.02551976591348648, lr = 0.0001
[07:39:57] INFO - Epoch 27/50, Iter 50300: Loss = 0.026955192908644676, lr = 0.0001
[07:40:31] INFO - Epoch 27/50, Iter 50400: Loss = 0.030265633016824722, lr = 0.0001
[07:41:06] INFO - Epoch 27/50, Iter 50500: Loss = 0.02354291081428528, lr = 0.0001
[07:41:43] INFO - Epoch 27/50, Iter 50600: Loss = 0.014263815246522427, lr = 0.0001
[07:42:21] INFO - Epoch 28/50, Iter 50700: Loss = 0.026106689125299454, lr = 0.0001
[07:42:59] INFO - Epoch 28/50, Iter 50800: Loss = 0.02534874901175499, lr = 0.0001
[07:43:37] INFO - Epoch 28/50, Iter 50900: Loss = 0.02099444344639778, lr = 0.0001
[07:45:25] INFO - Epoch 28/50, Iter 51000: Loss = 0.021261703222990036, lr = 0.0001
[07:46:02] INFO - Epoch 28/50, Iter 51100: Loss = 0.016304541379213333, lr = 0.0001
[07:46:39] INFO - Epoch 28/50, Iter 51200: Loss = 0.020184708759188652, lr = 0.0001
[07:47:15] INFO - Epoch 28/50, Iter 51300: Loss = 0.01964147947728634, lr = 0.0001
[07:47:51] INFO - Epoch 28/50, Iter 51400: Loss = 0.016097456216812134, lr = 0.0001
[07:48:26] INFO - Epoch 28/50, Iter 51500: Loss = 0.018887262791395187, lr = 0.0001
[07:49:01] INFO - Epoch 28/50, Iter 51600: Loss = 0.03289520740509033, lr = 0.0001
[07:49:39] INFO - Epoch 28/50, Iter 51700: Loss = 0.02468728832900524, lr = 0.0001
[07:50:16] INFO - Epoch 28/50, Iter 51800: Loss = 0.020057909190654755, lr = 0.0001
[07:50:54] INFO - Epoch 28/50, Iter 51900: Loss = 0.020394371822476387, lr = 0.0001
[07:52:41] INFO - Epoch 28/50, Iter 52000: Loss = 0.02179614081978798, lr = 0.0001
[07:53:18] INFO - Epoch 28/50, Iter 52100: Loss = 0.018156271427869797, lr = 0.0001
[07:53:55] INFO - Epoch 28/50, Iter 52200: Loss = 0.02341829240322113, lr = 0.0001
[07:54:33] INFO - Epoch 28/50, Iter 52300: Loss = 0.016954025253653526, lr = 0.0001
[07:55:10] INFO - Epoch 28/50, Iter 52400: Loss = 0.026269305497407913, lr = 0.0001
[07:55:46] INFO - Epoch 29/50, Iter 52500: Loss = 0.01687164232134819, lr = 0.0001
[07:56:21] INFO - Epoch 29/50, Iter 52600: Loss = 0.01376437209546566, lr = 0.0001
[07:56:58] INFO - Epoch 29/50, Iter 52700: Loss = 0.021159611642360687, lr = 0.0001
[07:57:36] INFO - Epoch 29/50, Iter 52800: Loss = 0.015487756580114365, lr = 0.0001
[07:58:14] INFO - Epoch 29/50, Iter 52900: Loss = 0.025838203728199005, lr = 0.0001
[08:00:02] INFO - Epoch 29/50, Iter 53000: Loss = 0.02396319806575775, lr = 0.0001
[08:00:39] INFO - Epoch 29/50, Iter 53100: Loss = 0.019110538065433502, lr = 0.0001
[08:01:16] INFO - Epoch 29/50, Iter 53200: Loss = 0.01159975677728653, lr = 0.0001
[08:01:53] INFO - Epoch 29/50, Iter 53300: Loss = 0.03230958431959152, lr = 0.0001
[08:02:29] INFO - Epoch 29/50, Iter 53400: Loss = 0.022003935649991035, lr = 0.0001
[08:03:06] INFO - Epoch 29/50, Iter 53500: Loss = 0.011917732656002045, lr = 0.0001
[08:03:40] INFO - Epoch 29/50, Iter 53600: Loss = 0.024439413100481033, lr = 0.0001
[08:04:15] INFO - Epoch 29/50, Iter 53700: Loss = 0.02025175467133522, lr = 0.0001
[08:04:52] INFO - Epoch 29/50, Iter 53800: Loss = 0.017246924340724945, lr = 0.0001
[08:05:30] INFO - Epoch 29/50, Iter 53900: Loss = 0.030383361503481865, lr = 0.0001
[08:07:17] INFO - Epoch 29/50, Iter 54000: Loss = 0.01954091340303421, lr = 0.0001
[08:07:54] INFO - Epoch 29/50, Iter 54100: Loss = 0.0225138571113348, lr = 0.0001
[08:08:32] INFO - Epoch 29/50, Iter 54200: Loss = 0.01854889467358589, lr = 0.0001
[08:09:09] INFO - Epoch 29/50, Iter 54300: Loss = 0.027329208329319954, lr = 0.0001
[08:09:47] INFO - Epoch 30/50, Iter 54400: Loss = 0.02209412306547165, lr = 0.0001
[08:10:25] INFO - Epoch 30/50, Iter 54500: Loss = 0.02240779995918274, lr = 0.0001
[08:11:01] INFO - Epoch 30/50, Iter 54600: Loss = 0.016268890351057053, lr = 0.0001
[08:11:37] INFO - Epoch 30/50, Iter 54700: Loss = 0.020547280088067055, lr = 0.0001
[08:12:14] INFO - Epoch 30/50, Iter 54800: Loss = 0.025404835119843483, lr = 0.0001
[08:12:52] INFO - Epoch 30/50, Iter 54900: Loss = 0.04109298810362816, lr = 0.0001
[08:14:39] INFO - Epoch 30/50, Iter 55000: Loss = 0.025483297184109688, lr = 0.0001
[08:15:16] INFO - Epoch 30/50, Iter 55100: Loss = 0.02378198504447937, lr = 0.0001
[08:15:53] INFO - Epoch 30/50, Iter 55200: Loss = 0.02577335573732853, lr = 0.0001
[08:16:30] INFO - Epoch 30/50, Iter 55300: Loss = 0.018335986882448196, lr = 0.0001
[08:17:06] INFO - Epoch 30/50, Iter 55400: Loss = 0.018661705777049065, lr = 0.0001
[08:17:43] INFO - Epoch 30/50, Iter 55500: Loss = 0.016169201582670212, lr = 0.0001
[08:18:20] INFO - Epoch 30/50, Iter 55600: Loss = 0.029093626886606216, lr = 0.0001
[08:18:55] INFO - Epoch 30/50, Iter 55700: Loss = 0.01622368022799492, lr = 0.0001
[08:19:29] INFO - Epoch 30/50, Iter 55800: Loss = 0.012564092874526978, lr = 0.0001
[08:20:06] INFO - Epoch 30/50, Iter 55900: Loss = 0.03472227603197098, lr = 0.0001
[08:21:54] INFO - Epoch 30/50, Iter 56000: Loss = 0.025271758437156677, lr = 0.0001
[08:22:31] INFO - Epoch 30/50, Iter 56100: Loss = 0.015396498143672943, lr = 0.0001
[08:23:08] INFO - Epoch 30/50, Iter 56200: Loss = 0.015089810825884342, lr = 0.0001
[08:23:47] INFO - Epoch 31/50, Iter 56300: Loss = 0.022155551239848137, lr = 0.0001
[08:24:25] INFO - Epoch 31/50, Iter 56400: Loss = 0.023600995540618896, lr = 0.0001
[08:25:03] INFO - Epoch 31/50, Iter 56500: Loss = 0.014499511569738388, lr = 0.0001
[08:25:41] INFO - Epoch 31/50, Iter 56600: Loss = 0.01854860782623291, lr = 0.0001
[08:26:17] INFO - Epoch 31/50, Iter 56700: Loss = 0.014885067008435726, lr = 0.0001
[08:26:52] INFO - Epoch 31/50, Iter 56800: Loss = 0.02499360591173172, lr = 0.0001
[08:27:29] INFO - Epoch 31/50, Iter 56900: Loss = 0.019067181274294853, lr = 0.0001
[08:29:17] INFO - Epoch 31/50, Iter 57000: Loss = 0.016186274588108063, lr = 0.0001
[08:29:53] INFO - Epoch 31/50, Iter 57100: Loss = 0.018789513036608696, lr = 0.0001
[08:30:30] INFO - Epoch 31/50, Iter 57200: Loss = 0.02824380248785019, lr = 0.0001
[08:31:07] INFO - Epoch 31/50, Iter 57300: Loss = 0.014734972268342972, lr = 0.0001
[08:31:44] INFO - Epoch 31/50, Iter 57400: Loss = 0.027844443917274475, lr = 0.0001
[08:32:20] INFO - Epoch 31/50, Iter 57500: Loss = 0.017645347863435745, lr = 0.0001
[08:32:57] INFO - Epoch 31/50, Iter 57600: Loss = 0.026852741837501526, lr = 0.0001
[08:33:34] INFO - Epoch 31/50, Iter 57700: Loss = 0.018187761306762695, lr = 0.0001
[08:34:09] INFO - Epoch 31/50, Iter 57800: Loss = 0.015949510037899017, lr = 0.0001
[08:34:44] INFO - Epoch 31/50, Iter 57900: Loss = 0.030537914484739304, lr = 0.0001
[08:36:30] INFO - Epoch 31/50, Iter 58000: Loss = 0.023328498005867004, lr = 0.0001
[08:37:08] INFO - Epoch 31/50, Iter 58100: Loss = 0.0321945920586586, lr = 0.0001
[08:37:46] INFO - Epoch 32/50, Iter 58200: Loss = 0.021406956017017365, lr = 0.0001
[08:38:24] INFO - Epoch 32/50, Iter 58300: Loss = 0.024833301082253456, lr = 0.0001
[08:39:02] INFO - Epoch 32/50, Iter 58400: Loss = 0.02409757860004902, lr = 0.0001
[08:39:40] INFO - Epoch 32/50, Iter 58500: Loss = 0.02115483582019806, lr = 0.0001
[08:40:18] INFO - Epoch 32/50, Iter 58600: Loss = 0.028434213250875473, lr = 0.0001
[08:40:56] INFO - Epoch 32/50, Iter 58700: Loss = 0.01535562239587307, lr = 0.0001
[08:41:33] INFO - Epoch 32/50, Iter 58800: Loss = 0.018513666465878487, lr = 0.0001
[08:42:09] INFO - Epoch 32/50, Iter 58900: Loss = 0.01970413699746132, lr = 0.0001
[08:43:55] INFO - Epoch 32/50, Iter 59000: Loss = 0.023043164983391762, lr = 0.0001
[08:44:31] INFO - Epoch 32/50, Iter 59100: Loss = 0.022449225187301636, lr = 0.0001
[08:45:08] INFO - Epoch 32/50, Iter 59200: Loss = 0.02532496303319931, lr = 0.0001
[08:45:44] INFO - Epoch 32/50, Iter 59300: Loss = 0.01836356148123741, lr = 0.0001
[08:46:21] INFO - Epoch 32/50, Iter 59400: Loss = 0.023496415466070175, lr = 0.0001
[08:46:58] INFO - Epoch 32/50, Iter 59500: Loss = 0.021977299824357033, lr = 0.0001
[08:47:35] INFO - Epoch 32/50, Iter 59600: Loss = 0.01530459150671959, lr = 0.0001
[08:48:11] INFO - Epoch 32/50, Iter 59700: Loss = 0.018574871122837067, lr = 0.0001
[08:48:48] INFO - Epoch 32/50, Iter 59800: Loss = 0.01716908998787403, lr = 0.0001
[08:49:24] INFO - Epoch 32/50, Iter 59900: Loss = 0.02111116237938404, lr = 0.0001
[08:51:08] INFO - Epoch 33/50, Iter 60000: Loss = 0.018158450722694397, lr = 0.0001
[08:51:46] INFO - Epoch 33/50, Iter 60100: Loss = 0.026417307555675507, lr = 0.0001
[08:52:24] INFO - Epoch 33/50, Iter 60200: Loss = 0.018158096820116043, lr = 0.0001
[08:53:02] INFO - Epoch 33/50, Iter 60300: Loss = 0.016817064955830574, lr = 0.0001
[08:53:40] INFO - Epoch 33/50, Iter 60400: Loss = 0.02153771184384823, lr = 0.0001
[08:54:18] INFO - Epoch 33/50, Iter 60500: Loss = 0.022119596600532532, lr = 0.0001
[08:54:56] INFO - Epoch 33/50, Iter 60600: Loss = 0.019562236964702606, lr = 0.0001
[08:55:34] INFO - Epoch 33/50, Iter 60700: Loss = 0.020703531801700592, lr = 0.0001
[08:56:12] INFO - Epoch 33/50, Iter 60800: Loss = 0.016628460958600044, lr = 0.0001
[08:56:50] INFO - Epoch 33/50, Iter 60900: Loss = 0.02273157238960266, lr = 0.0001
[08:58:33] INFO - Epoch 33/50, Iter 61000: Loss = 0.024464242160320282, lr = 0.0001
[08:59:09] INFO - Epoch 33/50, Iter 61100: Loss = 0.013031220994889736, lr = 0.0001
[08:59:46] INFO - Epoch 33/50, Iter 61200: Loss = 0.021556008607149124, lr = 0.0001
[09:00:23] INFO - Epoch 33/50, Iter 61300: Loss = 0.029755286872386932, lr = 0.0001
[09:00:59] INFO - Epoch 33/50, Iter 61400: Loss = 0.032875772565603256, lr = 0.0001
[09:01:36] INFO - Epoch 33/50, Iter 61500: Loss = 0.025967784225940704, lr = 0.0001
[09:02:13] INFO - Epoch 33/50, Iter 61600: Loss = 0.030686652287840843, lr = 0.0001
[09:02:50] INFO - Epoch 33/50, Iter 61700: Loss = 0.024082669988274574, lr = 0.0001
[09:03:27] INFO - Epoch 33/50, Iter 61800: Loss = 0.030128881335258484, lr = 0.0001
[09:04:04] INFO - Epoch 34/50, Iter 61900: Loss = 0.025132764130830765, lr = 0.0001
[09:05:47] INFO - Epoch 34/50, Iter 62000: Loss = 0.022055231034755707, lr = 0.0001
[09:06:24] INFO - Epoch 34/50, Iter 62100: Loss = 0.03396378830075264, lr = 0.0001
[09:07:01] INFO - Epoch 34/50, Iter 62200: Loss = 0.023605257272720337, lr = 0.0001
[09:07:39] INFO - Epoch 34/50, Iter 62300: Loss = 0.020592767745256424, lr = 0.0001
[09:08:16] INFO - Epoch 34/50, Iter 62400: Loss = 0.02211090177297592, lr = 0.0001
[09:08:54] INFO - Epoch 34/50, Iter 62500: Loss = 0.01478223130106926, lr = 0.0001
[09:09:31] INFO - Epoch 34/50, Iter 62600: Loss = 0.024198908358812332, lr = 0.0001
[09:10:09] INFO - Epoch 34/50, Iter 62700: Loss = 0.01895963028073311, lr = 0.0001
[09:10:46] INFO - Epoch 34/50, Iter 62800: Loss = 0.01958467997610569, lr = 0.0001
[09:11:24] INFO - Epoch 34/50, Iter 62900: Loss = 0.03069506585597992, lr = 0.0001
[09:13:07] INFO - Epoch 34/50, Iter 63000: Loss = 0.02130581997334957, lr = 0.0001
[09:13:42] INFO - Epoch 34/50, Iter 63100: Loss = 0.02590073272585869, lr = 0.0001
[09:14:19] INFO - Epoch 34/50, Iter 63200: Loss = 0.01849909871816635, lr = 0.0001
[09:14:56] INFO - Epoch 34/50, Iter 63300: Loss = 0.023221593350172043, lr = 0.0001
[09:15:33] INFO - Epoch 34/50, Iter 63400: Loss = 0.03609362989664078, lr = 0.0001
[09:16:10] INFO - Epoch 34/50, Iter 63500: Loss = 0.020269108936190605, lr = 0.0001
[09:16:46] INFO - Epoch 34/50, Iter 63600: Loss = 0.02487366460263729, lr = 0.0001
[09:17:23] INFO - Epoch 34/50, Iter 63700: Loss = 0.020187098532915115, lr = 0.0001
[09:18:01] INFO - Epoch 35/50, Iter 63800: Loss = 0.017752237617969513, lr = 0.0001
[09:18:38] INFO - Epoch 35/50, Iter 63900: Loss = 0.021988939493894577, lr = 0.0001
[09:20:23] INFO - Epoch 35/50, Iter 64000: Loss = 0.021837353706359863, lr = 0.0001
[09:20:58] INFO - Epoch 35/50, Iter 64100: Loss = 0.027255743741989136, lr = 0.0001
[09:21:34] INFO - Epoch 35/50, Iter 64200: Loss = 0.016279345378279686, lr = 0.0001
[09:22:12] INFO - Epoch 35/50, Iter 64300: Loss = 0.021551430225372314, lr = 0.0001
[09:22:49] INFO - Epoch 35/50, Iter 64400: Loss = 0.02154885232448578, lr = 0.0001
[09:23:27] INFO - Epoch 35/50, Iter 64500: Loss = 0.023760154843330383, lr = 0.0001
[09:24:04] INFO - Epoch 35/50, Iter 64600: Loss = 0.02199278213083744, lr = 0.0001
[09:24:42] INFO - Epoch 35/50, Iter 64700: Loss = 0.023603856563568115, lr = 0.0001
[09:25:19] INFO - Epoch 35/50, Iter 64800: Loss = 0.028215087950229645, lr = 0.0001
[09:25:57] INFO - Epoch 35/50, Iter 64900: Loss = 0.019689366221427917, lr = 0.0001
[09:27:42] INFO - Epoch 35/50, Iter 65000: Loss = 0.03234357759356499, lr = 0.0001
[09:28:17] INFO - Epoch 35/50, Iter 65100: Loss = 0.020737197250127792, lr = 0.0001
[09:28:52] INFO - Epoch 35/50, Iter 65200: Loss = 0.017809413373470306, lr = 0.0001
[09:29:29] INFO - Epoch 35/50, Iter 65300: Loss = 0.02523978427052498, lr = 0.0001
[09:30:07] INFO - Epoch 35/50, Iter 65400: Loss = 0.019607078284025192, lr = 0.0001
[09:30:44] INFO - Epoch 35/50, Iter 65500: Loss = 0.021371446549892426, lr = 0.0001
[09:31:22] INFO - Epoch 35/50, Iter 65600: Loss = 0.020804964005947113, lr = 0.0001
[09:32:00] INFO - Epoch 36/50, Iter 65700: Loss = 0.021034738048911095, lr = 0.0001
[09:32:38] INFO - Epoch 36/50, Iter 65800: Loss = 0.018361229449510574, lr = 0.0001
[09:33:16] INFO - Epoch 36/50, Iter 65900: Loss = 0.019015271216630936, lr = 0.0001
[09:35:05] INFO - Epoch 36/50, Iter 66000: Loss = 0.022577553987503052, lr = 0.0001
[09:35:40] INFO - Epoch 36/50, Iter 66100: Loss = 0.009200166910886765, lr = 0.0001
[09:36:14] INFO - Epoch 36/50, Iter 66200: Loss = 0.02068813145160675, lr = 0.0001
[09:36:51] INFO - Epoch 36/50, Iter 66300: Loss = 0.01857619732618332, lr = 0.0001
[09:37:28] INFO - Epoch 36/50, Iter 66400: Loss = 0.02619405835866928, lr = 0.0001
[09:38:06] INFO - Epoch 36/50, Iter 66500: Loss = 0.01501368172466755, lr = 0.0001
[09:38:43] INFO - Epoch 36/50, Iter 66600: Loss = 0.01750001311302185, lr = 0.0001
[09:39:21] INFO - Epoch 36/50, Iter 66700: Loss = 0.027220875024795532, lr = 0.0001
[09:39:58] INFO - Epoch 36/50, Iter 66800: Loss = 0.012615697458386421, lr = 0.0001
[09:40:35] INFO - Epoch 36/50, Iter 66900: Loss = 0.017686940729618073, lr = 0.0001
[09:42:21] INFO - Epoch 36/50, Iter 67000: Loss = 0.027093440294265747, lr = 0.0001
[09:42:58] INFO - Epoch 36/50, Iter 67100: Loss = 0.03175349906086922, lr = 0.0001
[09:43:32] INFO - Epoch 36/50, Iter 67200: Loss = 0.016025781631469727, lr = 0.0001
[09:44:07] INFO - Epoch 36/50, Iter 67300: Loss = 0.01850888319313526, lr = 0.0001
[09:44:45] INFO - Epoch 36/50, Iter 67400: Loss = 0.017480308189988136, lr = 0.0001
[09:45:23] INFO - Epoch 37/50, Iter 67500: Loss = 0.025209972634911537, lr = 0.0001
[09:46:01] INFO - Epoch 37/50, Iter 67600: Loss = 0.02159825712442398, lr = 0.0001
[09:46:39] INFO - Epoch 37/50, Iter 67700: Loss = 0.023625709116458893, lr = 0.0001
[09:47:17] INFO - Epoch 37/50, Iter 67800: Loss = 0.02304173819720745, lr = 0.0001
[09:47:55] INFO - Epoch 37/50, Iter 67900: Loss = 0.027355562895536423, lr = 0.0001
[09:49:43] INFO - Epoch 37/50, Iter 68000: Loss = 0.016158344224095345, lr = 0.0001
[09:50:21] INFO - Epoch 37/50, Iter 68100: Loss = 0.028835609555244446, lr = 0.0001
[09:50:56] INFO - Epoch 37/50, Iter 68200: Loss = 0.018121257424354553, lr = 0.0001
[09:51:31] INFO - Epoch 37/50, Iter 68300: Loss = 0.02724415808916092, lr = 0.0001
[09:52:07] INFO - Epoch 37/50, Iter 68400: Loss = 0.022671695798635483, lr = 0.0001
[09:52:45] INFO - Epoch 37/50, Iter 68500: Loss = 0.03411524370312691, lr = 0.0001
[09:53:22] INFO - Epoch 37/50, Iter 68600: Loss = 0.029655056074261665, lr = 0.0001
[09:53:59] INFO - Epoch 37/50, Iter 68700: Loss = 0.01793760247528553, lr = 0.0001
[09:54:37] INFO - Epoch 37/50, Iter 68800: Loss = 0.02609744668006897, lr = 0.0001
[09:55:14] INFO - Epoch 37/50, Iter 68900: Loss = 0.02326042577624321, lr = 0.0001
[09:57:00] INFO - Epoch 37/50, Iter 69000: Loss = 0.02808242477476597, lr = 0.0001
[09:57:37] INFO - Epoch 37/50, Iter 69100: Loss = 0.018454603850841522, lr = 0.0001
[09:58:14] INFO - Epoch 37/50, Iter 69200: Loss = 0.0236714668571949, lr = 0.0001
[09:58:48] INFO - Epoch 37/50, Iter 69300: Loss = 0.02115646004676819, lr = 0.0001
[09:59:24] INFO - Epoch 38/50, Iter 69400: Loss = 0.025313185527920723, lr = 0.0001
[10:00:01] INFO - Epoch 38/50, Iter 69500: Loss = 0.017547637224197388, lr = 0.0001
[10:00:39] INFO - Epoch 38/50, Iter 69600: Loss = 0.016801120713353157, lr = 0.0001
[10:01:17] INFO - Epoch 38/50, Iter 69700: Loss = 0.028473760932683945, lr = 0.0001
[10:01:55] INFO - Epoch 38/50, Iter 69800: Loss = 0.02027265354990959, lr = 0.0001
[10:02:33] INFO - Epoch 38/50, Iter 69900: Loss = 0.02449711039662361, lr = 0.0001
[10:04:22] INFO - Epoch 38/50, Iter 70000: Loss = 0.024156518280506134, lr = 0.0001
[10:04:59] INFO - Epoch 38/50, Iter 70100: Loss = 0.020525965839624405, lr = 0.0001
[10:05:37] INFO - Epoch 38/50, Iter 70200: Loss = 0.022750582545995712, lr = 0.0001
[10:06:12] INFO - Epoch 38/50, Iter 70300: Loss = 0.020152883604168892, lr = 0.0001
[10:06:47] INFO - Epoch 38/50, Iter 70400: Loss = 0.020488817244768143, lr = 0.0001
[10:07:23] INFO - Epoch 38/50, Iter 70500: Loss = 0.02505185827612877, lr = 0.0001
[10:08:00] INFO - Epoch 38/50, Iter 70600: Loss = 0.022866712883114815, lr = 0.0001
[10:08:38] INFO - Epoch 38/50, Iter 70700: Loss = 0.015947509557008743, lr = 0.0001
[10:09:15] INFO - Epoch 38/50, Iter 70800: Loss = 0.016218503937125206, lr = 0.0001
[10:09:53] INFO - Epoch 38/50, Iter 70900: Loss = 0.02521585300564766, lr = 0.0001
[10:11:39] INFO - Epoch 38/50, Iter 71000: Loss = 0.01854109577834606, lr = 0.0001
[10:12:15] INFO - Epoch 38/50, Iter 71100: Loss = 0.019408322870731354, lr = 0.0001
[10:12:52] INFO - Epoch 38/50, Iter 71200: Loss = 0.01332402229309082, lr = 0.0001
[10:13:30] INFO - Epoch 39/50, Iter 71300: Loss = 0.02230134978890419, lr = 0.0001
[10:14:06] INFO - Epoch 39/50, Iter 71400: Loss = 0.025569632649421692, lr = 0.0001
[10:14:41] INFO - Epoch 39/50, Iter 71500: Loss = 0.025923438370227814, lr = 0.0001
[10:15:18] INFO - Epoch 39/50, Iter 71600: Loss = 0.025623483583331108, lr = 0.0001
[10:15:56] INFO - Epoch 39/50, Iter 71700: Loss = 0.02185159921646118, lr = 0.0001
[10:16:35] INFO - Epoch 39/50, Iter 71800: Loss = 0.028699517250061035, lr = 0.0001
[10:17:13] INFO - Epoch 39/50, Iter 71900: Loss = 0.020399484783411026, lr = 0.0001
[10:19:01] INFO - Epoch 39/50, Iter 72000: Loss = 0.018890781328082085, lr = 0.0001
[10:19:38] INFO - Epoch 39/50, Iter 72100: Loss = 0.019233493134379387, lr = 0.0001
[10:20:16] INFO - Epoch 39/50, Iter 72200: Loss = 0.02685868740081787, lr = 0.0001
[10:20:53] INFO - Epoch 39/50, Iter 72300: Loss = 0.01708034612238407, lr = 0.0001
[10:21:30] INFO - Epoch 39/50, Iter 72400: Loss = 0.01932934671640396, lr = 0.0001
[10:22:04] INFO - Epoch 39/50, Iter 72500: Loss = 0.01994146592915058, lr = 0.0001
[10:22:40] INFO - Epoch 39/50, Iter 72600: Loss = 0.030141036957502365, lr = 0.0001
[10:23:18] INFO - Epoch 39/50, Iter 72700: Loss = 0.01653864048421383, lr = 0.0001
[10:23:55] INFO - Epoch 39/50, Iter 72800: Loss = 0.01582333818078041, lr = 0.0001
[10:24:32] INFO - Epoch 39/50, Iter 72900: Loss = 0.030131559818983078, lr = 0.0001
[10:26:18] INFO - Epoch 39/50, Iter 73000: Loss = 0.020023521035909653, lr = 0.0001
[10:26:55] INFO - Epoch 39/50, Iter 73100: Loss = 0.023662405088543892, lr = 0.0001
[10:27:33] INFO - Epoch 40/50, Iter 73200: Loss = 0.023484613746404648, lr = 0.0001
[10:28:10] INFO - Epoch 40/50, Iter 73300: Loss = 0.017320852726697922, lr = 0.0001
[10:28:48] INFO - Epoch 40/50, Iter 73400: Loss = 0.019257768988609314, lr = 0.0001
[10:29:23] INFO - Epoch 40/50, Iter 73500: Loss = 0.026130840182304382, lr = 0.0001
[10:29:59] INFO - Epoch 40/50, Iter 73600: Loss = 0.03614780306816101, lr = 0.0001
[10:30:36] INFO - Epoch 40/50, Iter 73700: Loss = 0.025453750044107437, lr = 0.0001
[10:31:14] INFO - Epoch 40/50, Iter 73800: Loss = 0.02823317050933838, lr = 0.0001
[10:31:52] INFO - Epoch 40/50, Iter 73900: Loss = 0.0226666908711195, lr = 0.0001
[10:33:40] INFO - Epoch 40/50, Iter 74000: Loss = 0.022746136412024498, lr = 0.0001
[10:34:17] INFO - Epoch 40/50, Iter 74100: Loss = 0.01721629686653614, lr = 0.0001
[10:34:55] INFO - Epoch 40/50, Iter 74200: Loss = 0.02461112290620804, lr = 0.0001
[10:35:32] INFO - Epoch 40/50, Iter 74300: Loss = 0.024060944095253944, lr = 0.0001
[10:36:10] INFO - Epoch 40/50, Iter 74400: Loss = 0.021712781861424446, lr = 0.0001
[10:36:46] INFO - Epoch 40/50, Iter 74500: Loss = 0.015306558459997177, lr = 0.0001
[10:37:21] INFO - Epoch 40/50, Iter 74600: Loss = 0.030041517689824104, lr = 0.0001
[10:37:56] INFO - Epoch 40/50, Iter 74700: Loss = 0.01286664605140686, lr = 0.0001
[10:38:33] INFO - Epoch 40/50, Iter 74800: Loss = 0.03005480021238327, lr = 0.0001
[10:39:11] INFO - Epoch 40/50, Iter 74900: Loss = 0.017003972083330154, lr = 0.0001
[10:40:57] INFO - Epoch 41/50, Iter 75000: Loss = 0.014750601723790169, lr = 0.0001
[10:41:35] INFO - Epoch 41/50, Iter 75100: Loss = 0.027623731642961502, lr = 0.0001
[10:42:12] INFO - Epoch 41/50, Iter 75200: Loss = 0.02428785338997841, lr = 0.0001
[10:42:49] INFO - Epoch 41/50, Iter 75300: Loss = 0.020127184689044952, lr = 0.0001
[10:43:27] INFO - Epoch 41/50, Iter 75400: Loss = 0.020427513867616653, lr = 0.0001
[10:44:04] INFO - Epoch 41/50, Iter 75500: Loss = 0.015857383608818054, lr = 0.0001
[10:44:41] INFO - Epoch 41/50, Iter 75600: Loss = 0.023515712469816208, lr = 0.0001
[10:45:16] INFO - Epoch 41/50, Iter 75700: Loss = 0.021348096430301666, lr = 0.0001
[10:45:52] INFO - Epoch 41/50, Iter 75800: Loss = 0.021761475130915642, lr = 0.0001
[10:46:30] INFO - Epoch 41/50, Iter 75900: Loss = 0.02231479063630104, lr = 0.0001
[10:48:19] INFO - Epoch 41/50, Iter 76000: Loss = 0.020590530708432198, lr = 0.0001
[10:48:56] INFO - Epoch 41/50, Iter 76100: Loss = 0.025658369064331055, lr = 0.0001
[10:49:34] INFO - Epoch 41/50, Iter 76200: Loss = 0.018263330683112144, lr = 0.0001
[10:50:11] INFO - Epoch 41/50, Iter 76300: Loss = 0.02799496240913868, lr = 0.0001
[10:50:49] INFO - Epoch 41/50, Iter 76400: Loss = 0.020270638167858124, lr = 0.0001
[10:51:26] INFO - Epoch 41/50, Iter 76500: Loss = 0.025936413556337357, lr = 0.0001
[10:52:03] INFO - Epoch 41/50, Iter 76600: Loss = 0.012957521714270115, lr = 0.0001
[10:52:38] INFO - Epoch 41/50, Iter 76700: Loss = 0.014417669735848904, lr = 0.0001
[10:53:13] INFO - Epoch 41/50, Iter 76800: Loss = 0.01625163108110428, lr = 0.0001
[10:53:51] INFO - Epoch 42/50, Iter 76900: Loss = 0.022058110684156418, lr = 0.0001
[10:55:36] INFO - Epoch 42/50, Iter 77000: Loss = 0.017570260912179947, lr = 0.0001
[10:56:13] INFO - Epoch 42/50, Iter 77100: Loss = 0.020291034132242203, lr = 0.0001
[10:56:50] INFO - Epoch 42/50, Iter 77200: Loss = 0.035155974328517914, lr = 0.0001
[10:57:27] INFO - Epoch 42/50, Iter 77300: Loss = 0.03369952365756035, lr = 0.0001
[10:58:04] INFO - Epoch 42/50, Iter 77400: Loss = 0.032326798886060715, lr = 0.0001
[10:58:40] INFO - Epoch 42/50, Iter 77500: Loss = 0.018110264092683792, lr = 0.0001
[10:59:17] INFO - Epoch 42/50, Iter 77600: Loss = 0.018036026507616043, lr = 0.0001
[10:59:54] INFO - Epoch 42/50, Iter 77700: Loss = 0.019200392067432404, lr = 0.0001
[11:00:28] INFO - Epoch 42/50, Iter 77800: Loss = 0.0195014625787735, lr = 0.0001
[11:01:03] INFO - Epoch 42/50, Iter 77900: Loss = 0.023430032655596733, lr = 0.0001
[11:02:51] INFO - Epoch 42/50, Iter 78000: Loss = 0.02310262620449066, lr = 0.0001
[11:03:28] INFO - Epoch 42/50, Iter 78100: Loss = 0.02130754664540291, lr = 0.0001
[11:04:06] INFO - Epoch 42/50, Iter 78200: Loss = 0.01928720250725746, lr = 0.0001
[11:04:43] INFO - Epoch 42/50, Iter 78300: Loss = 0.017581766471266747, lr = 0.0001
[11:05:21] INFO - Epoch 42/50, Iter 78400: Loss = 0.021702248603105545, lr = 0.0001
[11:05:58] INFO - Epoch 42/50, Iter 78500: Loss = 0.022716041654348373, lr = 0.0001
[11:06:35] INFO - Epoch 42/50, Iter 78600: Loss = 0.026689473539590836, lr = 0.0001
[11:07:13] INFO - Epoch 42/50, Iter 78700: Loss = 0.025399215519428253, lr = 0.0001
[11:07:49] INFO - Epoch 43/50, Iter 78800: Loss = 0.023977046832442284, lr = 0.0001
[11:08:25] INFO - Epoch 43/50, Iter 78900: Loss = 0.03005555458366871, lr = 0.0001
[11:10:10] INFO - Epoch 43/50, Iter 79000: Loss = 0.022378981113433838, lr = 0.0001
[11:10:46] INFO - Epoch 43/50, Iter 79100: Loss = 0.025676846504211426, lr = 0.0001
[11:11:23] INFO - Epoch 43/50, Iter 79200: Loss = 0.018473926931619644, lr = 0.0001
[11:12:00] INFO - Epoch 43/50, Iter 79300: Loss = 0.029371149837970734, lr = 0.0001
[11:12:37] INFO - Epoch 43/50, Iter 79400: Loss = 0.015338984318077564, lr = 0.0001
[11:13:14] INFO - Epoch 43/50, Iter 79500: Loss = 0.030672969296574593, lr = 0.0001
[11:13:50] INFO - Epoch 43/50, Iter 79600: Loss = 0.013775693252682686, lr = 0.0001
[11:14:27] INFO - Epoch 43/50, Iter 79700: Loss = 0.028863955289125443, lr = 0.0001
[11:15:04] INFO - Epoch 43/50, Iter 79800: Loss = 0.027279574424028397, lr = 0.0001
[11:15:39] INFO - Epoch 43/50, Iter 79900: Loss = 0.02491520531475544, lr = 0.0001
[11:17:23] INFO - Epoch 43/50, Iter 80000: Loss = 0.022316288203001022, lr = 0.0001
[11:18:01] INFO - Epoch 43/50, Iter 80100: Loss = 0.02023676037788391, lr = 0.0001
[11:18:38] INFO - Epoch 43/50, Iter 80200: Loss = 0.020290840417146683, lr = 0.0001
[11:19:16] INFO - Epoch 43/50, Iter 80300: Loss = 0.01622021570801735, lr = 0.0001
[11:19:53] INFO - Epoch 43/50, Iter 80400: Loss = 0.021102596074342728, lr = 0.0001
[11:20:31] INFO - Epoch 43/50, Iter 80500: Loss = 0.029457077383995056, lr = 0.0001
[11:21:08] INFO - Epoch 43/50, Iter 80600: Loss = 0.024694763123989105, lr = 0.0001
[11:21:47] INFO - Epoch 44/50, Iter 80700: Loss = 0.012608902528882027, lr = 0.0001
[11:22:24] INFO - Epoch 44/50, Iter 80800: Loss = 0.024759817868471146, lr = 0.0001
[11:23:01] INFO - Epoch 44/50, Iter 80900: Loss = 0.027624113485217094, lr = 0.0001
[11:24:44] INFO - Epoch 44/50, Iter 81000: Loss = 0.02646869421005249, lr = 0.0001
[11:25:22] INFO - Epoch 44/50, Iter 81100: Loss = 0.017517074942588806, lr = 0.0001
[11:25:59] INFO - Epoch 44/50, Iter 81200: Loss = 0.009943831712007523, lr = 0.0001
[11:26:37] INFO - Epoch 44/50, Iter 81300: Loss = 0.015972964465618134, lr = 0.0001
[11:27:14] INFO - Epoch 44/50, Iter 81400: Loss = 0.017368219792842865, lr = 0.0001
[11:27:51] INFO - Epoch 44/50, Iter 81500: Loss = 0.018138565123081207, lr = 0.0001
[11:28:29] INFO - Epoch 44/50, Iter 81600: Loss = 0.02059100940823555, lr = 0.0001
[11:29:06] INFO - Epoch 44/50, Iter 81700: Loss = 0.017378471791744232, lr = 0.0001
[11:29:44] INFO - Epoch 44/50, Iter 81800: Loss = 0.023443616926670074, lr = 0.0001
[11:30:21] INFO - Epoch 44/50, Iter 81900: Loss = 0.024056710302829742, lr = 0.0001
[11:32:03] INFO - Epoch 44/50, Iter 82000: Loss = 0.015559646300971508, lr = 0.0001
[11:32:41] INFO - Epoch 44/50, Iter 82100: Loss = 0.015559978783130646, lr = 0.0001
[11:33:18] INFO - Epoch 44/50, Iter 82200: Loss = 0.02814953401684761, lr = 0.0001
[11:33:56] INFO - Epoch 44/50, Iter 82300: Loss = 0.02466312237083912, lr = 0.0001
[11:34:33] INFO - Epoch 44/50, Iter 82400: Loss = 0.017446378245949745, lr = 0.0001
[11:35:11] INFO - Epoch 45/50, Iter 82500: Loss = 0.019831202924251556, lr = 0.0001
[11:35:50] INFO - Epoch 45/50, Iter 82600: Loss = 0.016719266772270203, lr = 0.0001
[11:36:28] INFO - Epoch 45/50, Iter 82700: Loss = 0.01663721725344658, lr = 0.0001
[11:37:05] INFO - Epoch 45/50, Iter 82800: Loss = 0.024095885455608368, lr = 0.0001
[11:37:42] INFO - Epoch 45/50, Iter 82900: Loss = 0.022868715226650238, lr = 0.0001
[11:39:25] INFO - Epoch 45/50, Iter 83000: Loss = 0.022109508514404297, lr = 0.0001
[11:40:02] INFO - Epoch 45/50, Iter 83100: Loss = 0.023459019139409065, lr = 0.0001
[11:40:39] INFO - Epoch 45/50, Iter 83200: Loss = 0.03357243910431862, lr = 0.0001
[11:41:17] INFO - Epoch 45/50, Iter 83300: Loss = 0.01947803422808647, lr = 0.0001
[11:41:54] INFO - Epoch 45/50, Iter 83400: Loss = 0.014463461935520172, lr = 0.0001
[11:42:32] INFO - Epoch 45/50, Iter 83500: Loss = 0.017590757459402084, lr = 0.0001
[11:43:09] INFO - Epoch 45/50, Iter 83600: Loss = 0.012953747063875198, lr = 0.0001
[11:43:47] INFO - Epoch 45/50, Iter 83700: Loss = 0.011775579303503036, lr = 0.0001
[11:44:24] INFO - Epoch 45/50, Iter 83800: Loss = 0.033017270267009735, lr = 0.0001
[11:45:01] INFO - Epoch 45/50, Iter 83900: Loss = 0.012742359191179276, lr = 0.0001
[11:46:45] INFO - Epoch 45/50, Iter 84000: Loss = 0.019268862903118134, lr = 0.0001
[11:47:21] INFO - Epoch 45/50, Iter 84100: Loss = 0.020279936492443085, lr = 0.0001
[11:47:59] INFO - Epoch 45/50, Iter 84200: Loss = 0.01858804188668728, lr = 0.0001
[11:48:36] INFO - Epoch 45/50, Iter 84300: Loss = 0.014711486175656319, lr = 0.0001
[11:49:14] INFO - Epoch 46/50, Iter 84400: Loss = 0.020954683423042297, lr = 0.0001
[11:49:52] INFO - Epoch 46/50, Iter 84500: Loss = 0.02662809006869793, lr = 0.0001
[11:50:30] INFO - Epoch 46/50, Iter 84600: Loss = 0.021922439336776733, lr = 0.0001
[11:51:08] INFO - Epoch 46/50, Iter 84700: Loss = 0.021114500239491463, lr = 0.0001
[11:51:45] INFO - Epoch 46/50, Iter 84800: Loss = 0.017373420298099518, lr = 0.0001
[11:52:23] INFO - Epoch 46/50, Iter 84900: Loss = 0.020827889442443848, lr = 0.0001
[11:54:07] INFO - Epoch 46/50, Iter 85000: Loss = 0.0218573696911335, lr = 0.0001
[11:54:42] INFO - Epoch 46/50, Iter 85100: Loss = 0.019245875999331474, lr = 0.0001
[11:55:19] INFO - Epoch 46/50, Iter 85200: Loss = 0.017498616129159927, lr = 0.0001
[11:55:57] INFO - Epoch 46/50, Iter 85300: Loss = 0.0184156596660614, lr = 0.0001
[11:56:34] INFO - Epoch 46/50, Iter 85400: Loss = 0.02401101216673851, lr = 0.0001
[11:57:12] INFO - Epoch 46/50, Iter 85500: Loss = 0.018305890262126923, lr = 0.0001
[11:57:49] INFO - Epoch 46/50, Iter 85600: Loss = 0.03495640307664871, lr = 0.0001
[11:58:27] INFO - Epoch 46/50, Iter 85700: Loss = 0.021866515278816223, lr = 0.0001
[11:59:04] INFO - Epoch 46/50, Iter 85800: Loss = 0.035283900797367096, lr = 0.0001
[11:59:42] INFO - Epoch 46/50, Iter 85900: Loss = 0.020653875544667244, lr = 0.0001
[12:01:28] INFO - Epoch 46/50, Iter 86000: Loss = 0.016537442803382874, lr = 0.0001
[12:02:03] INFO - Epoch 46/50, Iter 86100: Loss = 0.0210992731153965, lr = 0.0001
[12:02:39] INFO - Epoch 46/50, Iter 86200: Loss = 0.023491602391004562, lr = 0.0001
[12:03:17] INFO - Epoch 47/50, Iter 86300: Loss = 0.02632911317050457, lr = 0.0001
[12:03:55] INFO - Epoch 47/50, Iter 86400: Loss = 0.022847235202789307, lr = 0.0001
[12:04:33] INFO - Epoch 47/50, Iter 86500: Loss = 0.018759798258543015, lr = 0.0001
[12:05:11] INFO - Epoch 47/50, Iter 86600: Loss = 0.01871965453028679, lr = 0.0001
[12:05:49] INFO - Epoch 47/50, Iter 86700: Loss = 0.01559593714773655, lr = 0.0001
[12:06:26] INFO - Epoch 47/50, Iter 86800: Loss = 0.021482981741428375, lr = 0.0001
[12:07:03] INFO - Epoch 47/50, Iter 86900: Loss = 0.01850007474422455, lr = 0.0001
[12:08:50] INFO - Epoch 47/50, Iter 87000: Loss = 0.016197603195905685, lr = 0.0001
[12:09:25] INFO - Epoch 47/50, Iter 87100: Loss = 0.0179985873401165, lr = 0.0001
[12:09:59] INFO - Epoch 47/50, Iter 87200: Loss = 0.017149612307548523, lr = 0.0001
[12:10:36] INFO - Epoch 47/50, Iter 87300: Loss = 0.019468747079372406, lr = 0.0001
[12:11:14] INFO - Epoch 47/50, Iter 87400: Loss = 0.022250430658459663, lr = 0.0001
[12:11:51] INFO - Epoch 47/50, Iter 87500: Loss = 0.02432246319949627, lr = 0.0001
[12:12:29] INFO - Epoch 47/50, Iter 87600: Loss = 0.016115814447402954, lr = 0.0001
[12:13:06] INFO - Epoch 47/50, Iter 87700: Loss = 0.016428790986537933, lr = 0.0001
[12:13:44] INFO - Epoch 47/50, Iter 87800: Loss = 0.027514930814504623, lr = 0.0001
[12:14:21] INFO - Epoch 47/50, Iter 87900: Loss = 0.020233802497386932, lr = 0.0001
[12:16:09] INFO - Epoch 47/50, Iter 88000: Loss = 0.019230294972658157, lr = 0.0001
[12:16:45] INFO - Epoch 47/50, Iter 88100: Loss = 0.026008252054452896, lr = 0.0001
[12:17:21] INFO - Epoch 48/50, Iter 88200: Loss = 0.022319599986076355, lr = 0.0001
[12:17:57] INFO - Epoch 48/50, Iter 88300: Loss = 0.015480638481676579, lr = 0.0001
[12:18:35] INFO - Epoch 48/50, Iter 88400: Loss = 0.02278859168291092, lr = 0.0001
[12:19:14] INFO - Epoch 48/50, Iter 88500: Loss = 0.017225494608283043, lr = 0.0001
[12:19:52] INFO - Epoch 48/50, Iter 88600: Loss = 0.024317804723978043, lr = 0.0001
[12:20:29] INFO - Epoch 48/50, Iter 88700: Loss = 0.020604224875569344, lr = 0.0001
[12:21:06] INFO - Epoch 48/50, Iter 88800: Loss = 0.01731717586517334, lr = 0.0001
[12:21:44] INFO - Epoch 48/50, Iter 88900: Loss = 0.018329227343201637, lr = 0.0001
[12:23:30] INFO - Epoch 48/50, Iter 89000: Loss = 0.018779577687382698, lr = 0.0001
[12:24:07] INFO - Epoch 48/50, Iter 89100: Loss = 0.028485845774412155, lr = 0.0001
[12:24:42] INFO - Epoch 48/50, Iter 89200: Loss = 0.022587072104215622, lr = 0.0001
[12:25:17] INFO - Epoch 48/50, Iter 89300: Loss = 0.02194858342409134, lr = 0.0001
[12:25:53] INFO - Epoch 48/50, Iter 89400: Loss = 0.016873138025403023, lr = 0.0001
[12:26:31] INFO - Epoch 48/50, Iter 89500: Loss = 0.024464264512062073, lr = 0.0001
[12:27:08] INFO - Epoch 48/50, Iter 89600: Loss = 0.02444087527692318, lr = 0.0001
[12:27:46] INFO - Epoch 48/50, Iter 89700: Loss = 0.01770823448896408, lr = 0.0001
[12:28:23] INFO - Epoch 48/50, Iter 89800: Loss = 0.019991975277662277, lr = 0.0001
[12:29:00] INFO - Epoch 48/50, Iter 89900: Loss = 0.022915782406926155, lr = 0.0001
[12:30:49] INFO - Epoch 49/50, Iter 90000: Loss = 0.02480982430279255, lr = 0.0001
[12:31:27] INFO - Epoch 49/50, Iter 90100: Loss = 0.018983453512191772, lr = 0.0001
[12:32:04] INFO - Epoch 49/50, Iter 90200: Loss = 0.018778514117002487, lr = 0.0001
[12:32:39] INFO - Epoch 49/50, Iter 90300: Loss = 0.018759869039058685, lr = 0.0001
[12:33:15] INFO - Epoch 49/50, Iter 90400: Loss = 0.020022587850689888, lr = 0.0001
[12:33:53] INFO - Epoch 49/50, Iter 90500: Loss = 0.02239784598350525, lr = 0.0001
[12:34:31] INFO - Epoch 49/50, Iter 90600: Loss = 0.021786922588944435, lr = 0.0001
[12:35:08] INFO - Epoch 49/50, Iter 90700: Loss = 0.021193988621234894, lr = 0.0001
[12:35:46] INFO - Epoch 49/50, Iter 90800: Loss = 0.019572975113987923, lr = 0.0001
[12:36:23] INFO - Epoch 49/50, Iter 90900: Loss = 0.016485311090946198, lr = 0.0001
[12:38:09] INFO - Epoch 49/50, Iter 91000: Loss = 0.021967381238937378, lr = 0.0001
[12:38:46] INFO - Epoch 49/50, Iter 91100: Loss = 0.018237147480249405, lr = 0.0001
[12:39:23] INFO - Epoch 49/50, Iter 91200: Loss = 0.01905180886387825, lr = 0.0001
[12:39:59] INFO - Epoch 49/50, Iter 91300: Loss = 0.02382483333349228, lr = 0.0001
[12:40:33] INFO - Epoch 49/50, Iter 91400: Loss = 0.02098831906914711, lr = 0.0001
[12:41:09] INFO - Epoch 49/50, Iter 91500: Loss = 0.02765822224318981, lr = 0.0001
[12:41:47] INFO - Epoch 49/50, Iter 91600: Loss = 0.023272905498743057, lr = 0.0001
[12:42:24] INFO - Epoch 49/50, Iter 91700: Loss = 0.02188965119421482, lr = 0.0001
[12:43:02] INFO - Epoch 49/50, Iter 91800: Loss = 0.026097562164068222, lr = 0.0001
[12:43:40] INFO - Epoch 50/50, Iter 91900: Loss = 0.018962332978844643, lr = 0.0001
[12:45:28] INFO - Epoch 50/50, Iter 92000: Loss = 0.02291695959866047, lr = 0.0001
[12:46:05] INFO - Epoch 50/50, Iter 92100: Loss = 0.033082619309425354, lr = 0.0001
[12:46:43] INFO - Epoch 50/50, Iter 92200: Loss = 0.030323170125484467, lr = 0.0001
[12:47:20] INFO - Epoch 50/50, Iter 92300: Loss = 0.022696129977703094, lr = 0.0001
[12:47:55] INFO - Epoch 50/50, Iter 92400: Loss = 0.020445533096790314, lr = 0.0001
[12:48:29] INFO - Epoch 50/50, Iter 92500: Loss = 0.02273436076939106, lr = 0.0001
[12:49:07] INFO - Epoch 50/50, Iter 92600: Loss = 0.021798046305775642, lr = 0.0001
[12:49:43] INFO - Epoch 50/50, Iter 92700: Loss = 0.02120419591665268, lr = 0.0001
[12:50:20] INFO - Epoch 50/50, Iter 92800: Loss = 0.027433019131422043, lr = 0.0001
[12:50:57] INFO - Epoch 50/50, Iter 92900: Loss = 0.025116585195064545, lr = 0.0001
[12:52:42] INFO - Epoch 50/50, Iter 93000: Loss = 0.02106088027358055, lr = 0.0001
[12:53:19] INFO - Epoch 50/50, Iter 93100: Loss = 0.016250556334853172, lr = 0.0001
[12:53:56] INFO - Epoch 50/50, Iter 93200: Loss = 0.016655270010232925, lr = 0.0001
[12:54:33] INFO - Epoch 50/50, Iter 93300: Loss = 0.020460784435272217, lr = 0.0001
[12:55:10] INFO - Epoch 50/50, Iter 93400: Loss = 0.02524268440902233, lr = 0.0001
[12:55:44] INFO - Epoch 50/50, Iter 93500: Loss = 0.01436917670071125, lr = 0.0001
[12:56:19] INFO - Epoch 50/50, Iter 93600: Loss = 0.019781406968832016, lr = 0.0001
[12:56:56] INFO - Epoch 50/50, Iter 93700: Loss = 0.01460881344974041, lr = 0.0001
|