diff --git "a/log/debug_0.log" "b/log/debug_0.log" new file mode 100644--- /dev/null +++ "b/log/debug_0.log" @@ -0,0 +1,15017 @@ +11/06/2021 21:16:12 - INFO - __main__ - Distributed environment: MULTI_GPU Backend: nccl +Num processes: 16 +Process index: 0 +Local process index: 0 +Device: cuda:0 +Use FP16 precision: True + +11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - /home/leandro/codeparrot-small/./ is already a clone of https://huggingface.co/lvwerra/codeparrot-small. Make sure you pull the latest changes with `repo.git_pull()`. +11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - Revision `proud-haze-135` does not exist. Created and checked out branch `proud-haze-135`. +11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - +11/06/2021 21:16:15 - INFO - datasets.data_files - Some files matched the pattern '*' at /home/leandro/codeparrot-clean-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/0b/f3/0bf3cd1320065c163f47a112458dc107650e3e862094b703b76073bd0b68663d'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/37/26/3726a0239b5cb7d0ef3ea36886c533d0becc7404217763015559edb546d53c94'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/e7/a9/e7a9ccbfe6bd92476f83eba205c47ed23732ace4c1bd7458d76d666ebbba3b1c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/73/73/737327c2b47693e00050aa3410c5eb402c66211a79740ab57f1c763a1e557563'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2a/7e/2a7e50bbdb90d6c4cec534c3f1dc7ec0e6a0dada15c07cfd94615940c632ce02'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5a/5f/5a5fbc19e0e76787f668ada7235203c10b0cbcdea0ecf8f873f8ec281cfe3494'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/74/31/7431977a8e3a6eb0348b821009495f85d9373c1f730f4a74b0db43326568f77d'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/50/38/503872def2ac44733fbefc2602ab16224caca0896aa1eba045025ef2d60efcdc'), PosixPath('/home/leandro/codeparrot-clean-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b6/ce/b6ce495492aedfc91b66efdfd214b2dfe44867c719d51590e1868e42f4e9b6dd'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/df/08/df0840d1657530c8fa9f82864be5999c515f54341d926c430a82528a6bb83740'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2f/62/2f628d890bceee216f87edb3c45d2e384ee2501ce41a4c4169efaa3363bef1d2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/0f/7a/0f7a67cd83c1c069995f0f2510ebf818dcc71d9658f189de1231d2b7aac8883c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/05/39/053944e1daead0b6de8e46ea2e0bc68b9247604c63a55d444ac3b9adb12e2cd2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/dc/ac/dcacb03d8f43f7879c5eab4422644d7b3797b47dbb0c9c84d88cbc85822d8306'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ac/e3/ace3ac440b380d604ab198cf8e838a2a375e7b0a6b5699ec74a8c79648f4bab8'), PosixPath('/home/leandro/codeparrot-clean-train/.git/description'), PosixPath('/home/leandro/codeparrot-clean-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/d4/9f/d49f1929644619c39cff677367ff2e18223a8046ec8f61e224954a10aa2ccf8f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2e/aa/2eaa21b832ed1496fb7f0b259666dbfc36ed483d81494d1e8705f9d601509c12'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/f1/a7/f1a7a250e1f6164a7fb602131ff54b69deb305258792f2358075403769d58fe5'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/d0/02/d0024828eece6d4d1c25cb4e539328be97fa28ce66a3b8d2374a117711cfd520'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/90/a5/90a573501de640c3e0e6f1b3508306febc96faf6061bb33c67894c168a1879c6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5d/42/5d42ba9f195510757a3699005a7c43ddede4b598caf8a5f2f8c84d1125fa6324'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5f/d1/5fd1bb56db810b65d1fd3866dc43d9c7b690c8f52b9ca8119b2a5f4c49d13eec'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/7c/0e/7c0ef87edb0e556939282c859c7c893a91b5b0f931394ca4cca4f4ec98a61951'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ee/c1/eec1a9546aac0444a706c09f6aab67cd64403940657417e30212b7ff1e16665c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/55/b6/55b6989a41ae296337356153e6081c61484d0b6734b6905683823e7317d01c42'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/cc/58/cc58b22515c4fd7d891287ee717c2054290b20c17b1c34693fd8964ab730687b'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b6/8a/b68a74f9784402dcb311f4db72a873035e47b98b185a1813ab2c1645cb7255a2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/fb/84/fb84ca8000808f62718994e4b44e79d88a05b345e9638d9f6cf6c8a5472da01f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/objects/pack/pack-12438cb8112d3b4104fefcb88d751872b5e0fd6e.pack'), PosixPath('/home/leandro/codeparrot-clean-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/12/8d/128d56e09d9d741b2778d733e595838a50a5e82fdc9adbb0aa8645457716b97e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/objects/pack/pack-12438cb8112d3b4104fefcb88d751872b5e0fd6e.idx'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b4/83/b4836655e350f0796acd2b1a206e657c2808d9f136afae095e0b94a790c704e1'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/3e/f2/3ef240d0b394384803ae1bbe3b30974e11eb9b1b6ad4f49afc2ed0f7c9eae0d6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/14/08/14089cad26037080ee900bede2fd42d5cac70738b2e77402b36681e1d2a521f6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/86/0e/860eda34e90456533e9dd41a5c0fdb74c54dc8d9cf43d6c60b887b2c858be831'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/15/ac/15ac016e4cd702bb184457cbf5674d71b632fc34c29611ba4de549b85c67acfb'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/a4/6b/a46b5c08d39691524b46fadf78eab5efefa29978edfee799ec3587d928dc1302'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/fa/e6/fae6b44a24c1c35f15053a19a6b2b2af5cc9fb8bdaf0da409068a2a1f333f28e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/17/5e/175e7375d6f65993071aa653bdd4e8b117cc02d1d2353cd7bcdbaaf7fe8b3c9c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ac/36/ac36d12d37c1dc8ee8d3b8f0eae93966ae73482ef725615bb1a715802ddd4dd4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/17/96/1796f12729d0407cc57500c9c87959e0e7becd729f37374702868ed8765015f4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/67/f1/67f1ff0d590fbf4aa9afa161c290fe9be17538d4b723278bb21fd6408b0e6a3e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/55/c9/55c9c0b2f26de96e0311ee43e8eaa78ad1af387d0c59a26f22c5ebd507dda321'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/config'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/9f/7e/9f7e18a3980d4b3d5ed9469ab7a2d67b608e8aa6fff38d876f86719c8f2a7a82'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/e6/48/e6484a578778beccab26c8549608ec13970e6bcdb9541cdccad20f4d984e8181'), PosixPath('/home/leandro/codeparrot-clean-train/.git/index'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/54/60/5460223b92bb118814a7777a939f4005b7426a7e4a068c193c10d1b86eeb862b'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ae/45/ae45741df674456bc63bad91374d2ba5ef988d33d6e2a322ef0a5ac8af040371'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/60/41/604177fe5560efd99d93091fadab6293afe7cd7d12f81638c301de1c937c1583'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ef/e1/efe1759837b74b5b5ed3df1a09d4c880f9ad20413d958f79d35bf1cb6a2a09d4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/32/be/32beb30e381ff02fb71854b5534306f395ef00f51f02b62da1f027c8c7fab26f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/9b/1b/9b1b8e52b9262f03f1719d3950dc8dfa2b9719dc2e273603023f6f329c1b2068'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/56/80/56803c607a19ccb576c90bdb10a02cfa7b3affc67dd150fa41b00cc22213b174'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/4e/39/4e392fcaae564652d234d07b4f71eeed90efe51b1b714831e39d77f3e537d3df'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/cd/33/cd339656799518495d23aedf1503459be6d3086e22672e80edab8403d12ded1c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/f1/62/f162b06b5dca01aa85ef9a675d396c0fbab1d009b5bee1c5b7ea6b415c6f12a4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-merge')] +11/06/2021 21:16:15 - WARNING - datasets.builder - Using custom data configuration codeparrot-clean-train-e839c6c1585da466 +11/06/2021 21:16:15 - INFO - datasets.data_files - Some files matched the pattern '*' at /home/leandro/codeparrot-clean-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/60/0dc2964cf471fa4aac706659009777cf176497'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/95/7b2579c6ef20995a09efd9a17f8fd90606f5ed'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/config'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/index'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/25/747fcf966f2b7b3a2f4149130bff69ebe83718'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/15/4f5f07c68026fb069c4bdfe3966893737035f4'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/6d/d1188965fcd7feab0efc3506668a615805e13f'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/description'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/d9/cd7ad451bcd8a388471b341a961d0e6e6ff558'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/55/36bbd68dd8f283092b22eb77a051175c1b727a'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/lfs/objects/7f/8c/7f8c20a737c9084779bcdb853325ad4774d0db52c74aa2a63fd658d6787eb35b'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/09/e6a70d1aadc53ed29b9890332f184f89d0a39b'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/5e/d5325308cb9a07b2c5807dad51120c9a75b6db'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-receive.sample')] +11/06/2021 21:16:15 - WARNING - datasets.builder - Using custom data configuration codeparrot-clean-valid-ced470bd23403144 +11/06/2021 21:16:43 - INFO - __main__ - Step 1: {'lr': 0.0, 'samples': 192, 'steps': 0, 'loss/train': 10.55798625946045} +11/06/2021 21:16:43 - INFO - root - Reducer buckets have been rebuilt in this iteration. +11/06/2021 21:16:43 - INFO - __main__ - Step 2: {'lr': 2.5e-07, 'samples': 384, 'steps': 1, 'loss/train': 10.535750389099121} +11/06/2021 21:16:43 - INFO - __main__ - Step 3: {'lr': 5e-07, 'samples': 576, 'steps': 2, 'loss/train': 10.530282974243164} +11/06/2021 21:16:44 - INFO - __main__ - Step 4: {'lr': 7.5e-07, 'samples': 768, 'steps': 3, 'loss/train': 10.527787208557129} +11/06/2021 21:16:45 - INFO - __main__ - Step 5: {'lr': 1e-06, 'samples': 960, 'steps': 4, 'loss/train': 10.491048812866211} +11/06/2021 21:16:46 - INFO - __main__ - Step 6: {'lr': 1.25e-06, 'samples': 1152, 'steps': 5, 'loss/train': 10.409588813781738} +11/06/2021 21:16:46 - INFO - __main__ - Step 7: {'lr': 1.5e-06, 'samples': 1344, 'steps': 6, 'loss/train': 10.350728034973145} +11/06/2021 21:16:46 - INFO - __main__ - Step 8: {'lr': 1.75e-06, 'samples': 1536, 'steps': 7, 'loss/train': 10.252238273620605} +11/06/2021 21:16:47 - INFO - __main__ - Step 9: {'lr': 2e-06, 'samples': 1728, 'steps': 8, 'loss/train': 10.193534851074219} +11/06/2021 21:16:47 - INFO - __main__ - Step 10: {'lr': 2.25e-06, 'samples': 1920, 'steps': 9, 'loss/train': 9.953790664672852} +11/06/2021 21:16:48 - INFO - __main__ - Step 11: {'lr': 2.5e-06, 'samples': 2112, 'steps': 10, 'loss/train': 10.194929122924805} +11/06/2021 21:16:49 - INFO - __main__ - Step 12: {'lr': 2.75e-06, 'samples': 2304, 'steps': 11, 'loss/train': 9.89802074432373} +11/06/2021 21:16:49 - INFO - __main__ - Step 13: {'lr': 3e-06, 'samples': 2496, 'steps': 12, 'loss/train': 9.843729972839355} +11/06/2021 21:16:49 - INFO - __main__ - Step 14: {'lr': 3.25e-06, 'samples': 2688, 'steps': 13, 'loss/train': 9.845044136047363} +11/06/2021 21:16:50 - INFO - __main__ - Step 15: {'lr': 3.5e-06, 'samples': 2880, 'steps': 14, 'loss/train': 9.869210243225098} +11/06/2021 21:16:51 - INFO - __main__ - Step 16: {'lr': 3.75e-06, 'samples': 3072, 'steps': 15, 'loss/train': 9.587459564208984} +11/06/2021 21:16:51 - INFO - __main__ - Step 17: {'lr': 4e-06, 'samples': 3264, 'steps': 16, 'loss/train': 9.667202949523926} +11/06/2021 21:16:51 - INFO - __main__ - Step 18: {'lr': 4.250000000000001e-06, 'samples': 3456, 'steps': 17, 'loss/train': 9.495230674743652} +11/06/2021 21:16:52 - INFO - __main__ - Step 19: {'lr': 4.5e-06, 'samples': 3648, 'steps': 18, 'loss/train': 9.640376091003418} +11/06/2021 21:16:52 - INFO - __main__ - Step 20: {'lr': 4.75e-06, 'samples': 3840, 'steps': 19, 'loss/train': 9.428448677062988} +11/06/2021 21:16:52 - INFO - __main__ - Step 21: {'lr': 5e-06, 'samples': 4032, 'steps': 20, 'loss/train': 9.341026306152344} +11/06/2021 21:16:54 - INFO - __main__ - Step 22: {'lr': 5.2500000000000006e-06, 'samples': 4224, 'steps': 21, 'loss/train': 9.372577667236328} +11/06/2021 21:16:54 - INFO - __main__ - Step 23: {'lr': 5.5e-06, 'samples': 4416, 'steps': 22, 'loss/train': 8.967851638793945} +11/06/2021 21:16:54 - INFO - __main__ - Step 24: {'lr': 5.75e-06, 'samples': 4608, 'steps': 23, 'loss/train': 8.74506950378418} +11/06/2021 21:16:55 - INFO - __main__ - Step 25: {'lr': 6e-06, 'samples': 4800, 'steps': 24, 'loss/train': 9.786674499511719} +11/06/2021 21:16:55 - INFO - __main__ - Step 26: {'lr': 6.25e-06, 'samples': 4992, 'steps': 25, 'loss/train': 9.504456520080566} +11/06/2021 21:16:56 - INFO - __main__ - Step 27: {'lr': 6.5e-06, 'samples': 5184, 'steps': 26, 'loss/train': 9.166744232177734} +11/06/2021 21:16:56 - INFO - __main__ - Step 28: {'lr': 6.75e-06, 'samples': 5376, 'steps': 27, 'loss/train': 8.682860374450684} +11/06/2021 21:16:57 - INFO - __main__ - Step 29: {'lr': 7e-06, 'samples': 5568, 'steps': 28, 'loss/train': 8.596318244934082} +11/06/2021 21:16:57 - INFO - __main__ - Step 30: {'lr': 7.250000000000001e-06, 'samples': 5760, 'steps': 29, 'loss/train': 9.048979759216309} +11/06/2021 21:16:57 - INFO - __main__ - Step 31: {'lr': 7.5e-06, 'samples': 5952, 'steps': 30, 'loss/train': 9.320890426635742} +11/06/2021 21:16:58 - INFO - __main__ - Step 32: {'lr': 7.75e-06, 'samples': 6144, 'steps': 31, 'loss/train': 8.952228546142578} +11/06/2021 21:16:59 - INFO - __main__ - Step 33: {'lr': 8e-06, 'samples': 6336, 'steps': 32, 'loss/train': 8.751225471496582} +11/06/2021 21:16:59 - INFO - __main__ - Step 34: {'lr': 8.25e-06, 'samples': 6528, 'steps': 33, 'loss/train': 9.156981468200684} +11/06/2021 21:17:00 - INFO - __main__ - Step 35: {'lr': 8.500000000000002e-06, 'samples': 6720, 'steps': 34, 'loss/train': 8.837956428527832} +11/06/2021 21:17:00 - INFO - __main__ - Step 36: {'lr': 8.750000000000001e-06, 'samples': 6912, 'steps': 35, 'loss/train': 8.935142517089844} +11/06/2021 21:17:01 - INFO - __main__ - Step 37: {'lr': 9e-06, 'samples': 7104, 'steps': 36, 'loss/train': 9.019933700561523} +11/06/2021 21:17:02 - INFO - __main__ - Step 38: {'lr': 9.25e-06, 'samples': 7296, 'steps': 37, 'loss/train': 8.594483375549316} +11/06/2021 21:17:02 - INFO - __main__ - Step 39: {'lr': 9.5e-06, 'samples': 7488, 'steps': 38, 'loss/train': 9.565625190734863} +11/06/2021 21:17:02 - INFO - __main__ - Step 40: {'lr': 9.75e-06, 'samples': 7680, 'steps': 39, 'loss/train': 9.195219039916992} +11/06/2021 21:17:03 - INFO - __main__ - Step 41: {'lr': 1e-05, 'samples': 7872, 'steps': 40, 'loss/train': 9.008049011230469} +11/06/2021 21:17:04 - INFO - __main__ - Step 42: {'lr': 1.025e-05, 'samples': 8064, 'steps': 41, 'loss/train': 9.54212760925293} +11/06/2021 21:17:04 - INFO - __main__ - Step 43: {'lr': 1.0500000000000001e-05, 'samples': 8256, 'steps': 42, 'loss/train': 9.074606895446777} +11/06/2021 21:17:04 - INFO - __main__ - Step 44: {'lr': 1.0749999999999999e-05, 'samples': 8448, 'steps': 43, 'loss/train': 9.575305938720703} +11/06/2021 21:17:05 - INFO - __main__ - Step 45: {'lr': 1.1e-05, 'samples': 8640, 'steps': 44, 'loss/train': 9.862631797790527} +11/06/2021 21:17:05 - INFO - __main__ - Step 46: {'lr': 1.1249999999999999e-05, 'samples': 8832, 'steps': 45, 'loss/train': 8.833338737487793} +11/06/2021 21:17:06 - INFO - __main__ - Step 47: {'lr': 1.15e-05, 'samples': 9024, 'steps': 46, 'loss/train': 8.830769538879395} +11/06/2021 21:17:07 - INFO - __main__ - Step 48: {'lr': 1.1750000000000001e-05, 'samples': 9216, 'steps': 47, 'loss/train': 8.828520774841309} +11/06/2021 21:17:07 - INFO - __main__ - Step 49: {'lr': 1.2e-05, 'samples': 9408, 'steps': 48, 'loss/train': 8.692312240600586} +11/06/2021 21:17:07 - INFO - __main__ - Step 50: {'lr': 1.2250000000000001e-05, 'samples': 9600, 'steps': 49, 'loss/train': 8.698874473571777} +11/06/2021 21:17:08 - INFO - __main__ - Step 51: {'lr': 1.25e-05, 'samples': 9792, 'steps': 50, 'loss/train': 8.904641151428223} +11/06/2021 21:17:09 - INFO - __main__ - Step 52: {'lr': 1.275e-05, 'samples': 9984, 'steps': 51, 'loss/train': 8.66476821899414} +11/06/2021 21:17:09 - INFO - __main__ - Step 53: {'lr': 1.3e-05, 'samples': 10176, 'steps': 52, 'loss/train': 8.561541557312012} +11/06/2021 21:17:10 - INFO - __main__ - Step 54: {'lr': 1.325e-05, 'samples': 10368, 'steps': 53, 'loss/train': 8.71354866027832} +11/06/2021 21:17:10 - INFO - __main__ - Step 55: {'lr': 1.35e-05, 'samples': 10560, 'steps': 54, 'loss/train': 8.084650993347168} +11/06/2021 21:17:10 - INFO - __main__ - Step 56: {'lr': 1.375e-05, 'samples': 10752, 'steps': 55, 'loss/train': 8.701323509216309} +11/06/2021 21:17:11 - INFO - __main__ - Step 57: {'lr': 1.4e-05, 'samples': 10944, 'steps': 56, 'loss/train': 8.886054039001465} +11/06/2021 21:17:12 - INFO - __main__ - Step 58: {'lr': 1.425e-05, 'samples': 11136, 'steps': 57, 'loss/train': 8.962408065795898} +11/06/2021 21:17:12 - INFO - __main__ - Step 59: {'lr': 1.4500000000000002e-05, 'samples': 11328, 'steps': 58, 'loss/train': 8.731340408325195} +11/06/2021 21:17:13 - INFO - __main__ - Step 60: {'lr': 1.475e-05, 'samples': 11520, 'steps': 59, 'loss/train': 8.48225212097168} +11/06/2021 21:17:13 - INFO - __main__ - Step 61: {'lr': 1.5e-05, 'samples': 11712, 'steps': 60, 'loss/train': 8.860502243041992} +11/06/2021 21:17:14 - INFO - __main__ - Step 62: {'lr': 1.525e-05, 'samples': 11904, 'steps': 61, 'loss/train': 8.848859786987305} +11/06/2021 21:17:15 - INFO - __main__ - Step 63: {'lr': 1.55e-05, 'samples': 12096, 'steps': 62, 'loss/train': 8.20711612701416} +11/06/2021 21:17:15 - INFO - __main__ - Step 64: {'lr': 1.575e-05, 'samples': 12288, 'steps': 63, 'loss/train': 10.296394348144531} +11/06/2021 21:17:15 - INFO - __main__ - Step 65: {'lr': 1.6e-05, 'samples': 12480, 'steps': 64, 'loss/train': 7.71311092376709} +11/06/2021 21:17:16 - INFO - __main__ - Step 66: {'lr': 1.6250000000000002e-05, 'samples': 12672, 'steps': 65, 'loss/train': 8.466562271118164} +11/06/2021 21:17:16 - INFO - __main__ - Step 67: {'lr': 1.65e-05, 'samples': 12864, 'steps': 66, 'loss/train': 8.35257339477539} +11/06/2021 21:17:17 - INFO - __main__ - Step 68: {'lr': 1.675e-05, 'samples': 13056, 'steps': 67, 'loss/train': 8.386396408081055} +11/06/2021 21:17:18 - INFO - __main__ - Step 69: {'lr': 1.7000000000000003e-05, 'samples': 13248, 'steps': 68, 'loss/train': 8.12002944946289} +11/06/2021 21:17:18 - INFO - __main__ - Step 70: {'lr': 1.7250000000000003e-05, 'samples': 13440, 'steps': 69, 'loss/train': 8.70462417602539} +11/06/2021 21:17:18 - INFO - __main__ - Step 71: {'lr': 1.7500000000000002e-05, 'samples': 13632, 'steps': 70, 'loss/train': 8.239697456359863} +11/06/2021 21:17:19 - INFO - __main__ - Step 72: {'lr': 1.7749999999999998e-05, 'samples': 13824, 'steps': 71, 'loss/train': 7.610179424285889} +11/06/2021 21:17:20 - INFO - __main__ - Step 73: {'lr': 1.8e-05, 'samples': 14016, 'steps': 72, 'loss/train': 7.8869452476501465} +11/06/2021 21:17:20 - INFO - __main__ - Step 74: {'lr': 1.825e-05, 'samples': 14208, 'steps': 73, 'loss/train': 7.692283630371094} +11/06/2021 21:17:21 - INFO - __main__ - Step 75: {'lr': 1.85e-05, 'samples': 14400, 'steps': 74, 'loss/train': 8.208292007446289} +11/06/2021 21:17:21 - INFO - __main__ - Step 76: {'lr': 1.875e-05, 'samples': 14592, 'steps': 75, 'loss/train': 7.97852897644043} +11/06/2021 21:17:21 - INFO - __main__ - Step 77: {'lr': 1.9e-05, 'samples': 14784, 'steps': 76, 'loss/train': 8.777739524841309} +11/06/2021 21:17:22 - INFO - __main__ - Step 78: {'lr': 1.925e-05, 'samples': 14976, 'steps': 77, 'loss/train': 7.68981409072876} +11/06/2021 21:17:23 - INFO - __main__ - Step 79: {'lr': 1.95e-05, 'samples': 15168, 'steps': 78, 'loss/train': 7.656458854675293} +11/06/2021 21:17:23 - INFO - __main__ - Step 80: {'lr': 1.975e-05, 'samples': 15360, 'steps': 79, 'loss/train': 8.30695915222168} +11/06/2021 21:17:23 - INFO - __main__ - Step 81: {'lr': 2e-05, 'samples': 15552, 'steps': 80, 'loss/train': 7.897383689880371} +11/06/2021 21:17:24 - INFO - __main__ - Step 82: {'lr': 2.025e-05, 'samples': 15744, 'steps': 81, 'loss/train': 8.267080307006836} +11/06/2021 21:17:25 - INFO - __main__ - Step 83: {'lr': 2.05e-05, 'samples': 15936, 'steps': 82, 'loss/train': 8.247127532958984} +11/06/2021 21:17:25 - INFO - __main__ - Step 84: {'lr': 2.0750000000000003e-05, 'samples': 16128, 'steps': 83, 'loss/train': 8.18776798248291} +11/06/2021 21:17:25 - INFO - __main__ - Step 85: {'lr': 2.1000000000000002e-05, 'samples': 16320, 'steps': 84, 'loss/train': 7.7213358879089355} +11/06/2021 21:17:26 - INFO - __main__ - Step 86: {'lr': 2.125e-05, 'samples': 16512, 'steps': 85, 'loss/train': 7.880347728729248} +11/06/2021 21:17:26 - INFO - __main__ - Step 87: {'lr': 2.1499999999999997e-05, 'samples': 16704, 'steps': 86, 'loss/train': 8.094650268554688} +11/06/2021 21:17:27 - INFO - __main__ - Step 88: {'lr': 2.175e-05, 'samples': 16896, 'steps': 87, 'loss/train': 7.1267242431640625} +11/06/2021 21:17:27 - INFO - __main__ - Step 89: {'lr': 2.2e-05, 'samples': 17088, 'steps': 88, 'loss/train': 7.992337703704834} +11/06/2021 21:17:28 - INFO - __main__ - Step 90: {'lr': 2.225e-05, 'samples': 17280, 'steps': 89, 'loss/train': 7.918111801147461} +11/06/2021 21:17:28 - INFO - __main__ - Step 91: {'lr': 2.2499999999999998e-05, 'samples': 17472, 'steps': 90, 'loss/train': 7.4610795974731445} +11/06/2021 21:17:29 - INFO - __main__ - Step 92: {'lr': 2.275e-05, 'samples': 17664, 'steps': 91, 'loss/train': 7.861474990844727} +11/06/2021 21:17:29 - INFO - __main__ - Step 93: {'lr': 2.3e-05, 'samples': 17856, 'steps': 92, 'loss/train': 7.493942737579346} +11/06/2021 21:17:30 - INFO - __main__ - Step 94: {'lr': 2.325e-05, 'samples': 18048, 'steps': 93, 'loss/train': 8.051450729370117} +11/06/2021 21:17:30 - INFO - __main__ - Step 95: {'lr': 2.3500000000000002e-05, 'samples': 18240, 'steps': 94, 'loss/train': 7.800515651702881} +11/06/2021 21:17:31 - INFO - __main__ - Step 96: {'lr': 2.375e-05, 'samples': 18432, 'steps': 95, 'loss/train': 7.40056037902832} +11/06/2021 21:17:31 - INFO - __main__ - Step 97: {'lr': 2.4e-05, 'samples': 18624, 'steps': 96, 'loss/train': 7.518774032592773} +11/06/2021 21:17:31 - INFO - __main__ - Step 98: {'lr': 2.425e-05, 'samples': 18816, 'steps': 97, 'loss/train': 7.735995292663574} +11/06/2021 21:17:32 - INFO - __main__ - Step 99: {'lr': 2.4500000000000003e-05, 'samples': 19008, 'steps': 98, 'loss/train': 7.60399866104126} +11/06/2021 21:17:33 - INFO - __main__ - Step 100: {'lr': 2.4750000000000002e-05, 'samples': 19200, 'steps': 99, 'loss/train': 7.875792980194092} +11/06/2021 21:17:33 - INFO - __main__ - Step 101: {'lr': 2.5e-05, 'samples': 19392, 'steps': 100, 'loss/train': 7.704280853271484} +11/06/2021 21:17:34 - INFO - __main__ - Step 102: {'lr': 2.525e-05, 'samples': 19584, 'steps': 101, 'loss/train': 7.629642009735107} +11/06/2021 21:17:34 - INFO - __main__ - Step 103: {'lr': 2.55e-05, 'samples': 19776, 'steps': 102, 'loss/train': 7.427465915679932} +11/06/2021 21:17:35 - INFO - __main__ - Step 104: {'lr': 2.575e-05, 'samples': 19968, 'steps': 103, 'loss/train': 7.325517654418945} +11/06/2021 21:17:35 - INFO - __main__ - Step 105: {'lr': 2.6e-05, 'samples': 20160, 'steps': 104, 'loss/train': 7.825165271759033} +11/06/2021 21:17:36 - INFO - __main__ - Step 106: {'lr': 2.625e-05, 'samples': 20352, 'steps': 105, 'loss/train': 7.557342529296875} +11/06/2021 21:17:36 - INFO - __main__ - Step 107: {'lr': 2.65e-05, 'samples': 20544, 'steps': 106, 'loss/train': 7.5471510887146} +11/06/2021 21:17:36 - INFO - __main__ - Step 108: {'lr': 2.675e-05, 'samples': 20736, 'steps': 107, 'loss/train': 7.51965856552124} +11/06/2021 21:17:37 - INFO - __main__ - Step 109: {'lr': 2.7e-05, 'samples': 20928, 'steps': 108, 'loss/train': 7.727786540985107} +11/06/2021 21:17:38 - INFO - __main__ - Step 110: {'lr': 2.725e-05, 'samples': 21120, 'steps': 109, 'loss/train': 8.008770942687988} +11/06/2021 21:17:38 - INFO - __main__ - Step 111: {'lr': 2.75e-05, 'samples': 21312, 'steps': 110, 'loss/train': 7.874051094055176} +11/06/2021 21:17:38 - INFO - __main__ - Step 112: {'lr': 2.775e-05, 'samples': 21504, 'steps': 111, 'loss/train': 7.637380599975586} +11/06/2021 21:17:39 - INFO - __main__ - Step 113: {'lr': 2.8e-05, 'samples': 21696, 'steps': 112, 'loss/train': 7.677240371704102} +11/06/2021 21:17:40 - INFO - __main__ - Step 114: {'lr': 2.8250000000000002e-05, 'samples': 21888, 'steps': 113, 'loss/train': 7.03343391418457} +11/06/2021 21:17:40 - INFO - __main__ - Step 115: {'lr': 2.85e-05, 'samples': 22080, 'steps': 114, 'loss/train': 7.615724563598633} +11/06/2021 21:17:41 - INFO - __main__ - Step 116: {'lr': 2.875e-05, 'samples': 22272, 'steps': 115, 'loss/train': 7.741561412811279} +11/06/2021 21:17:41 - INFO - __main__ - Step 117: {'lr': 2.9000000000000004e-05, 'samples': 22464, 'steps': 116, 'loss/train': 8.360411643981934} +11/06/2021 21:17:41 - INFO - __main__ - Step 118: {'lr': 2.9250000000000003e-05, 'samples': 22656, 'steps': 117, 'loss/train': 7.302130222320557} +11/06/2021 21:17:42 - INFO - __main__ - Step 119: {'lr': 2.95e-05, 'samples': 22848, 'steps': 118, 'loss/train': 7.071781158447266} +11/06/2021 21:17:43 - INFO - __main__ - Step 120: {'lr': 2.9749999999999998e-05, 'samples': 23040, 'steps': 119, 'loss/train': 7.1986308097839355} +11/06/2021 21:17:43 - INFO - __main__ - Step 121: {'lr': 3e-05, 'samples': 23232, 'steps': 120, 'loss/train': 6.897414684295654} +11/06/2021 21:17:43 - INFO - __main__ - Step 122: {'lr': 3.025e-05, 'samples': 23424, 'steps': 121, 'loss/train': 6.9648213386535645} +11/06/2021 21:17:44 - INFO - __main__ - Step 123: {'lr': 3.05e-05, 'samples': 23616, 'steps': 122, 'loss/train': 7.184485912322998} +11/06/2021 21:17:45 - INFO - __main__ - Step 124: {'lr': 3.075e-05, 'samples': 23808, 'steps': 123, 'loss/train': 6.945891857147217} +11/06/2021 21:17:45 - INFO - __main__ - Step 125: {'lr': 3.1e-05, 'samples': 24000, 'steps': 124, 'loss/train': 7.381505489349365} +11/06/2021 21:17:46 - INFO - __main__ - Step 126: {'lr': 3.125e-05, 'samples': 24192, 'steps': 125, 'loss/train': 7.457914352416992} +11/06/2021 21:17:46 - INFO - __main__ - Step 127: {'lr': 3.15e-05, 'samples': 24384, 'steps': 126, 'loss/train': 7.405432224273682} +11/06/2021 21:17:47 - INFO - __main__ - Step 128: {'lr': 3.175e-05, 'samples': 24576, 'steps': 127, 'loss/train': 7.172966003417969} +11/06/2021 21:17:48 - INFO - __main__ - Step 129: {'lr': 3.2e-05, 'samples': 24768, 'steps': 128, 'loss/train': 7.367163181304932} +11/06/2021 21:17:48 - INFO - __main__ - Step 130: {'lr': 3.2250000000000005e-05, 'samples': 24960, 'steps': 129, 'loss/train': 6.170543670654297} +11/06/2021 21:17:48 - INFO - __main__ - Step 131: {'lr': 3.2500000000000004e-05, 'samples': 25152, 'steps': 130, 'loss/train': 6.940507411956787} +11/06/2021 21:17:49 - INFO - __main__ - Step 132: {'lr': 3.275e-05, 'samples': 25344, 'steps': 131, 'loss/train': 7.2779364585876465} +11/06/2021 21:17:49 - INFO - __main__ - Step 133: {'lr': 3.3e-05, 'samples': 25536, 'steps': 132, 'loss/train': 6.9434428215026855} +11/06/2021 21:17:49 - INFO - __main__ - Step 134: {'lr': 3.325e-05, 'samples': 25728, 'steps': 133, 'loss/train': 7.035802841186523} +11/06/2021 21:17:50 - INFO - __main__ - Step 135: {'lr': 3.35e-05, 'samples': 25920, 'steps': 134, 'loss/train': 8.246500015258789} +11/06/2021 21:17:51 - INFO - __main__ - Step 136: {'lr': 3.375e-05, 'samples': 26112, 'steps': 135, 'loss/train': 6.835116386413574} +11/06/2021 21:17:51 - INFO - __main__ - Step 137: {'lr': 3.4000000000000007e-05, 'samples': 26304, 'steps': 136, 'loss/train': 6.883285999298096} +11/06/2021 21:17:51 - INFO - __main__ - Step 138: {'lr': 3.4250000000000006e-05, 'samples': 26496, 'steps': 137, 'loss/train': 7.106326103210449} +11/06/2021 21:17:52 - INFO - __main__ - Step 139: {'lr': 3.4500000000000005e-05, 'samples': 26688, 'steps': 138, 'loss/train': 7.33680534362793} +11/06/2021 21:17:53 - INFO - __main__ - Step 140: {'lr': 3.4750000000000004e-05, 'samples': 26880, 'steps': 139, 'loss/train': 6.972182273864746} +11/06/2021 21:17:53 - INFO - __main__ - Step 141: {'lr': 3.5000000000000004e-05, 'samples': 27072, 'steps': 140, 'loss/train': 6.676812171936035} +11/06/2021 21:17:54 - INFO - __main__ - Step 142: {'lr': 3.5249999999999996e-05, 'samples': 27264, 'steps': 141, 'loss/train': 7.476287364959717} +11/06/2021 21:17:54 - INFO - __main__ - Step 143: {'lr': 3.5499999999999996e-05, 'samples': 27456, 'steps': 142, 'loss/train': 6.697681903839111} +11/06/2021 21:17:54 - INFO - __main__ - Step 144: {'lr': 3.5749999999999995e-05, 'samples': 27648, 'steps': 143, 'loss/train': 6.98452091217041} +11/06/2021 21:17:55 - INFO - __main__ - Step 145: {'lr': 3.6e-05, 'samples': 27840, 'steps': 144, 'loss/train': 6.702653408050537} +11/06/2021 21:17:56 - INFO - __main__ - Step 146: {'lr': 3.625e-05, 'samples': 28032, 'steps': 145, 'loss/train': 7.03615140914917} +11/06/2021 21:17:56 - INFO - __main__ - Step 147: {'lr': 3.65e-05, 'samples': 28224, 'steps': 146, 'loss/train': 6.963271617889404} +11/06/2021 21:17:56 - INFO - __main__ - Step 148: {'lr': 3.675e-05, 'samples': 28416, 'steps': 147, 'loss/train': 6.389257907867432} +11/06/2021 21:17:57 - INFO - __main__ - Step 149: {'lr': 3.7e-05, 'samples': 28608, 'steps': 148, 'loss/train': 6.685713768005371} +11/06/2021 21:17:58 - INFO - __main__ - Step 150: {'lr': 3.725e-05, 'samples': 28800, 'steps': 149, 'loss/train': 6.8497772216796875} +11/06/2021 21:17:58 - INFO - __main__ - Step 151: {'lr': 3.75e-05, 'samples': 28992, 'steps': 150, 'loss/train': 6.36531925201416} +11/06/2021 21:17:59 - INFO - __main__ - Step 152: {'lr': 3.775e-05, 'samples': 29184, 'steps': 151, 'loss/train': 6.523715019226074} +11/06/2021 21:17:59 - INFO - __main__ - Step 153: {'lr': 3.8e-05, 'samples': 29376, 'steps': 152, 'loss/train': 7.334853172302246} +11/06/2021 21:17:59 - INFO - __main__ - Step 154: {'lr': 3.825e-05, 'samples': 29568, 'steps': 153, 'loss/train': 6.311091423034668} +11/06/2021 21:18:00 - INFO - __main__ - Step 155: {'lr': 3.85e-05, 'samples': 29760, 'steps': 154, 'loss/train': 6.930693626403809} +11/06/2021 21:18:01 - INFO - __main__ - Step 156: {'lr': 3.875e-05, 'samples': 29952, 'steps': 155, 'loss/train': 7.10976505279541} +11/06/2021 21:18:01 - INFO - __main__ - Step 157: {'lr': 3.9e-05, 'samples': 30144, 'steps': 156, 'loss/train': 6.257956504821777} +11/06/2021 21:18:01 - INFO - __main__ - Step 158: {'lr': 3.925e-05, 'samples': 30336, 'steps': 157, 'loss/train': 6.675495624542236} +11/06/2021 21:18:02 - INFO - __main__ - Step 159: {'lr': 3.95e-05, 'samples': 30528, 'steps': 158, 'loss/train': 6.756046295166016} +11/06/2021 21:18:03 - INFO - __main__ - Step 160: {'lr': 3.9750000000000004e-05, 'samples': 30720, 'steps': 159, 'loss/train': 7.092185020446777} +11/06/2021 21:18:03 - INFO - __main__ - Step 161: {'lr': 4e-05, 'samples': 30912, 'steps': 160, 'loss/train': 6.609521389007568} +11/06/2021 21:18:04 - INFO - __main__ - Step 162: {'lr': 4.025e-05, 'samples': 31104, 'steps': 161, 'loss/train': 6.6135945320129395} +11/06/2021 21:18:04 - INFO - __main__ - Step 163: {'lr': 4.05e-05, 'samples': 31296, 'steps': 162, 'loss/train': 6.731355667114258} +11/06/2021 21:18:04 - INFO - __main__ - Step 164: {'lr': 4.075e-05, 'samples': 31488, 'steps': 163, 'loss/train': 6.836953163146973} +11/06/2021 21:18:05 - INFO - __main__ - Step 165: {'lr': 4.1e-05, 'samples': 31680, 'steps': 164, 'loss/train': 6.64618444442749} +11/06/2021 21:18:06 - INFO - __main__ - Step 166: {'lr': 4.125e-05, 'samples': 31872, 'steps': 165, 'loss/train': 6.482452869415283} +11/06/2021 21:18:06 - INFO - __main__ - Step 167: {'lr': 4.1500000000000006e-05, 'samples': 32064, 'steps': 166, 'loss/train': 6.185523509979248} +11/06/2021 21:18:06 - INFO - __main__ - Step 168: {'lr': 4.1750000000000005e-05, 'samples': 32256, 'steps': 167, 'loss/train': 6.377339839935303} +11/06/2021 21:18:07 - INFO - __main__ - Step 169: {'lr': 4.2000000000000004e-05, 'samples': 32448, 'steps': 168, 'loss/train': 6.502751350402832} +11/06/2021 21:18:08 - INFO - __main__ - Step 170: {'lr': 4.2250000000000004e-05, 'samples': 32640, 'steps': 169, 'loss/train': 7.073266506195068} +11/06/2021 21:18:08 - INFO - __main__ - Step 171: {'lr': 4.25e-05, 'samples': 32832, 'steps': 170, 'loss/train': 6.543142318725586} +11/06/2021 21:18:08 - INFO - __main__ - Step 172: {'lr': 4.275e-05, 'samples': 33024, 'steps': 171, 'loss/train': 6.489956378936768} +11/06/2021 21:18:09 - INFO - __main__ - Step 173: {'lr': 4.2999999999999995e-05, 'samples': 33216, 'steps': 172, 'loss/train': 6.199307918548584} +11/06/2021 21:18:09 - INFO - __main__ - Step 174: {'lr': 4.325e-05, 'samples': 33408, 'steps': 173, 'loss/train': 6.356565475463867} +11/06/2021 21:18:10 - INFO - __main__ - Step 175: {'lr': 4.35e-05, 'samples': 33600, 'steps': 174, 'loss/train': 5.826794147491455} +11/06/2021 21:18:11 - INFO - __main__ - Step 176: {'lr': 4.375e-05, 'samples': 33792, 'steps': 175, 'loss/train': 7.043330192565918} +11/06/2021 21:18:11 - INFO - __main__ - Step 177: {'lr': 4.4e-05, 'samples': 33984, 'steps': 176, 'loss/train': 6.09688663482666} +11/06/2021 21:18:11 - INFO - __main__ - Step 178: {'lr': 4.425e-05, 'samples': 34176, 'steps': 177, 'loss/train': 6.213244915008545} +11/06/2021 21:18:12 - INFO - __main__ - Step 179: {'lr': 4.45e-05, 'samples': 34368, 'steps': 178, 'loss/train': 6.990470886230469} +11/06/2021 21:18:13 - INFO - __main__ - Step 180: {'lr': 4.475e-05, 'samples': 34560, 'steps': 179, 'loss/train': 6.256852149963379} +11/06/2021 21:18:13 - INFO - __main__ - Step 181: {'lr': 4.4999999999999996e-05, 'samples': 34752, 'steps': 180, 'loss/train': 7.177120685577393} +11/06/2021 21:18:13 - INFO - __main__ - Step 182: {'lr': 4.525e-05, 'samples': 34944, 'steps': 181, 'loss/train': 6.373216152191162} +11/06/2021 21:18:14 - INFO - __main__ - Step 183: {'lr': 4.55e-05, 'samples': 35136, 'steps': 182, 'loss/train': 7.0793328285217285} +11/06/2021 21:18:14 - INFO - __main__ - Step 184: {'lr': 4.575e-05, 'samples': 35328, 'steps': 183, 'loss/train': 6.392989158630371} +11/06/2021 21:18:15 - INFO - __main__ - Step 185: {'lr': 4.6e-05, 'samples': 35520, 'steps': 184, 'loss/train': 8.500471115112305} +11/06/2021 21:18:16 - INFO - __main__ - Step 186: {'lr': 4.625e-05, 'samples': 35712, 'steps': 185, 'loss/train': 6.313254356384277} +11/06/2021 21:18:16 - INFO - __main__ - Step 187: {'lr': 4.65e-05, 'samples': 35904, 'steps': 186, 'loss/train': 6.720587253570557} +11/06/2021 21:18:16 - INFO - __main__ - Step 188: {'lr': 4.675e-05, 'samples': 36096, 'steps': 187, 'loss/train': 5.526083469390869} +11/06/2021 21:18:17 - INFO - __main__ - Step 189: {'lr': 4.7000000000000004e-05, 'samples': 36288, 'steps': 188, 'loss/train': 5.93545389175415} +11/06/2021 21:18:17 - INFO - __main__ - Step 190: {'lr': 4.725e-05, 'samples': 36480, 'steps': 189, 'loss/train': 7.147458553314209} +11/06/2021 21:18:18 - INFO - __main__ - Step 191: {'lr': 4.75e-05, 'samples': 36672, 'steps': 190, 'loss/train': 6.479673385620117} +11/06/2021 21:18:18 - INFO - __main__ - Step 192: {'lr': 4.775e-05, 'samples': 36864, 'steps': 191, 'loss/train': 6.075639247894287} +11/06/2021 21:18:19 - INFO - __main__ - Step 193: {'lr': 4.8e-05, 'samples': 37056, 'steps': 192, 'loss/train': 6.69281005859375} +11/06/2021 21:18:19 - INFO - __main__ - Step 194: {'lr': 4.825e-05, 'samples': 37248, 'steps': 193, 'loss/train': 6.355683326721191} +11/06/2021 21:18:20 - INFO - __main__ - Step 195: {'lr': 4.85e-05, 'samples': 37440, 'steps': 194, 'loss/train': 6.180767059326172} +11/06/2021 21:18:20 - INFO - __main__ - Step 196: {'lr': 4.8750000000000006e-05, 'samples': 37632, 'steps': 195, 'loss/train': 5.40876579284668} +11/06/2021 21:18:21 - INFO - __main__ - Step 197: {'lr': 4.9000000000000005e-05, 'samples': 37824, 'steps': 196, 'loss/train': 7.284364700317383} +11/06/2021 21:18:21 - INFO - __main__ - Step 198: {'lr': 4.9250000000000004e-05, 'samples': 38016, 'steps': 197, 'loss/train': 6.532893180847168} +11/06/2021 21:18:22 - INFO - __main__ - Step 199: {'lr': 4.9500000000000004e-05, 'samples': 38208, 'steps': 198, 'loss/train': 6.542242527008057} +11/06/2021 21:18:22 - INFO - __main__ - Step 200: {'lr': 4.975e-05, 'samples': 38400, 'steps': 199, 'loss/train': 6.113000392913818} +11/06/2021 21:18:22 - INFO - __main__ - Step 201: {'lr': 5e-05, 'samples': 38592, 'steps': 200, 'loss/train': 6.284862995147705} +11/06/2021 21:18:23 - INFO - __main__ - Step 202: {'lr': 5.025e-05, 'samples': 38784, 'steps': 201, 'loss/train': 6.143826007843018} +11/06/2021 21:18:24 - INFO - __main__ - Step 203: {'lr': 5.05e-05, 'samples': 38976, 'steps': 202, 'loss/train': 6.595575332641602} +11/06/2021 21:18:24 - INFO - __main__ - Step 204: {'lr': 5.075000000000001e-05, 'samples': 39168, 'steps': 203, 'loss/train': 6.1036787033081055} +11/06/2021 21:18:24 - INFO - __main__ - Step 205: {'lr': 5.1e-05, 'samples': 39360, 'steps': 204, 'loss/train': 6.222804546356201} +11/06/2021 21:18:25 - INFO - __main__ - Step 206: {'lr': 5.125e-05, 'samples': 39552, 'steps': 205, 'loss/train': 5.817543029785156} +11/06/2021 21:18:26 - INFO - __main__ - Step 207: {'lr': 5.15e-05, 'samples': 39744, 'steps': 206, 'loss/train': 6.056823253631592} +11/06/2021 21:18:26 - INFO - __main__ - Step 208: {'lr': 5.175e-05, 'samples': 39936, 'steps': 207, 'loss/train': 6.261317729949951} +11/06/2021 21:18:27 - INFO - __main__ - Step 209: {'lr': 5.2e-05, 'samples': 40128, 'steps': 208, 'loss/train': 6.321830749511719} +11/06/2021 21:18:27 - INFO - __main__ - Step 210: {'lr': 5.2249999999999996e-05, 'samples': 40320, 'steps': 209, 'loss/train': 5.724458694458008} +11/06/2021 21:18:27 - INFO - __main__ - Step 211: {'lr': 5.25e-05, 'samples': 40512, 'steps': 210, 'loss/train': 6.434157371520996} +11/06/2021 21:18:28 - INFO - __main__ - Step 212: {'lr': 5.275e-05, 'samples': 40704, 'steps': 211, 'loss/train': 5.677988529205322} +11/06/2021 21:18:29 - INFO - __main__ - Step 213: {'lr': 5.3e-05, 'samples': 40896, 'steps': 212, 'loss/train': 5.744022846221924} +11/06/2021 21:18:29 - INFO - __main__ - Step 214: {'lr': 5.325e-05, 'samples': 41088, 'steps': 213, 'loss/train': 5.744656562805176} +11/06/2021 21:18:29 - INFO - __main__ - Step 215: {'lr': 5.35e-05, 'samples': 41280, 'steps': 214, 'loss/train': 5.984218597412109} +11/06/2021 21:18:30 - INFO - __main__ - Step 216: {'lr': 5.375e-05, 'samples': 41472, 'steps': 215, 'loss/train': 6.307746887207031} +11/06/2021 21:18:31 - INFO - __main__ - Step 217: {'lr': 5.4e-05, 'samples': 41664, 'steps': 216, 'loss/train': 6.040472030639648} +11/06/2021 21:18:31 - INFO - __main__ - Step 218: {'lr': 5.4250000000000004e-05, 'samples': 41856, 'steps': 217, 'loss/train': 6.029814720153809} +11/06/2021 21:18:31 - INFO - __main__ - Step 219: {'lr': 5.45e-05, 'samples': 42048, 'steps': 218, 'loss/train': 6.033048629760742} +11/06/2021 21:18:32 - INFO - __main__ - Step 220: {'lr': 5.475e-05, 'samples': 42240, 'steps': 219, 'loss/train': 5.9049153327941895} +11/06/2021 21:18:32 - INFO - __main__ - Step 221: {'lr': 5.5e-05, 'samples': 42432, 'steps': 220, 'loss/train': 6.097071170806885} +11/06/2021 21:18:33 - INFO - __main__ - Step 222: {'lr': 5.525e-05, 'samples': 42624, 'steps': 221, 'loss/train': 6.372702598571777} +11/06/2021 21:18:33 - INFO - __main__ - Step 223: {'lr': 5.55e-05, 'samples': 42816, 'steps': 222, 'loss/train': 7.301460266113281} +11/06/2021 21:18:34 - INFO - __main__ - Step 224: {'lr': 5.575e-05, 'samples': 43008, 'steps': 223, 'loss/train': 6.467023849487305} +11/06/2021 21:18:34 - INFO - __main__ - Step 225: {'lr': 5.6e-05, 'samples': 43200, 'steps': 224, 'loss/train': 6.188560962677002} +11/06/2021 21:18:34 - INFO - __main__ - Step 226: {'lr': 5.6250000000000005e-05, 'samples': 43392, 'steps': 225, 'loss/train': 5.94260311126709} +11/06/2021 21:18:36 - INFO - __main__ - Step 227: {'lr': 5.6500000000000005e-05, 'samples': 43584, 'steps': 226, 'loss/train': 5.925175189971924} +11/06/2021 21:18:36 - INFO - __main__ - Step 228: {'lr': 5.6750000000000004e-05, 'samples': 43776, 'steps': 227, 'loss/train': 5.587348937988281} +11/06/2021 21:18:36 - INFO - __main__ - Step 229: {'lr': 5.7e-05, 'samples': 43968, 'steps': 228, 'loss/train': 5.978050231933594} +11/06/2021 21:18:37 - INFO - __main__ - Step 230: {'lr': 5.725e-05, 'samples': 44160, 'steps': 229, 'loss/train': 5.728048324584961} +11/06/2021 21:18:37 - INFO - __main__ - Step 231: {'lr': 5.75e-05, 'samples': 44352, 'steps': 230, 'loss/train': 6.196109771728516} +11/06/2021 21:18:37 - INFO - __main__ - Step 232: {'lr': 5.775e-05, 'samples': 44544, 'steps': 231, 'loss/train': 6.567146301269531} +11/06/2021 21:18:38 - INFO - __main__ - Step 233: {'lr': 5.800000000000001e-05, 'samples': 44736, 'steps': 232, 'loss/train': 5.301417827606201} +11/06/2021 21:18:39 - INFO - __main__ - Step 234: {'lr': 5.8250000000000006e-05, 'samples': 44928, 'steps': 233, 'loss/train': 5.6201348304748535} +11/06/2021 21:18:39 - INFO - __main__ - Step 235: {'lr': 5.8500000000000006e-05, 'samples': 45120, 'steps': 234, 'loss/train': 5.957462787628174} +11/06/2021 21:18:39 - INFO - __main__ - Step 236: {'lr': 5.875e-05, 'samples': 45312, 'steps': 235, 'loss/train': 6.2582688331604} +11/06/2021 21:18:40 - INFO - __main__ - Step 237: {'lr': 5.9e-05, 'samples': 45504, 'steps': 236, 'loss/train': 5.807918071746826} +11/06/2021 21:18:41 - INFO - __main__ - Step 238: {'lr': 5.925e-05, 'samples': 45696, 'steps': 237, 'loss/train': 5.977503299713135} +11/06/2021 21:18:41 - INFO - __main__ - Step 239: {'lr': 5.9499999999999996e-05, 'samples': 45888, 'steps': 238, 'loss/train': 5.574709892272949} +11/06/2021 21:18:42 - INFO - __main__ - Step 240: {'lr': 5.9749999999999995e-05, 'samples': 46080, 'steps': 239, 'loss/train': 5.93025016784668} +11/06/2021 21:18:42 - INFO - __main__ - Step 241: {'lr': 6e-05, 'samples': 46272, 'steps': 240, 'loss/train': 5.585808277130127} +11/06/2021 21:18:42 - INFO - __main__ - Step 242: {'lr': 6.025e-05, 'samples': 46464, 'steps': 241, 'loss/train': 6.203149318695068} +11/06/2021 21:18:43 - INFO - __main__ - Step 243: {'lr': 6.05e-05, 'samples': 46656, 'steps': 242, 'loss/train': 4.716400623321533} +11/06/2021 21:18:44 - INFO - __main__ - Step 244: {'lr': 6.075e-05, 'samples': 46848, 'steps': 243, 'loss/train': 5.850978851318359} +11/06/2021 21:18:44 - INFO - __main__ - Step 245: {'lr': 6.1e-05, 'samples': 47040, 'steps': 244, 'loss/train': 5.889804840087891} +11/06/2021 21:18:44 - INFO - __main__ - Step 246: {'lr': 6.125e-05, 'samples': 47232, 'steps': 245, 'loss/train': 5.8663225173950195} +11/06/2021 21:18:45 - INFO - __main__ - Step 247: {'lr': 6.15e-05, 'samples': 47424, 'steps': 246, 'loss/train': 5.8062334060668945} +11/06/2021 21:18:45 - INFO - __main__ - Step 248: {'lr': 6.175e-05, 'samples': 47616, 'steps': 247, 'loss/train': 5.754123210906982} +11/06/2021 21:18:46 - INFO - __main__ - Step 249: {'lr': 6.2e-05, 'samples': 47808, 'steps': 248, 'loss/train': 5.87885856628418} +11/06/2021 21:18:47 - INFO - __main__ - Step 250: {'lr': 6.225e-05, 'samples': 48000, 'steps': 249, 'loss/train': 5.715115070343018} +11/06/2021 21:18:47 - INFO - __main__ - Step 251: {'lr': 6.25e-05, 'samples': 48192, 'steps': 250, 'loss/train': 5.726807594299316} +11/06/2021 21:18:47 - INFO - __main__ - Step 252: {'lr': 6.275000000000001e-05, 'samples': 48384, 'steps': 251, 'loss/train': 5.94719934463501} +11/06/2021 21:18:48 - INFO - __main__ - Step 253: {'lr': 6.3e-05, 'samples': 48576, 'steps': 252, 'loss/train': 5.911177158355713} +11/06/2021 21:18:49 - INFO - __main__ - Step 254: {'lr': 6.325e-05, 'samples': 48768, 'steps': 253, 'loss/train': 5.7925004959106445} +11/06/2021 21:18:49 - INFO - __main__ - Step 255: {'lr': 6.35e-05, 'samples': 48960, 'steps': 254, 'loss/train': 5.541946887969971} +11/06/2021 21:18:50 - INFO - __main__ - Step 256: {'lr': 6.375e-05, 'samples': 49152, 'steps': 255, 'loss/train': 5.5716233253479} +11/06/2021 21:18:50 - INFO - __main__ - Step 257: {'lr': 6.4e-05, 'samples': 49344, 'steps': 256, 'loss/train': 6.297529697418213} +11/06/2021 21:18:50 - INFO - __main__ - Step 258: {'lr': 6.425e-05, 'samples': 49536, 'steps': 257, 'loss/train': 4.350067138671875} +11/06/2021 21:18:51 - INFO - __main__ - Step 259: {'lr': 6.450000000000001e-05, 'samples': 49728, 'steps': 258, 'loss/train': 5.1816887855529785} +11/06/2021 21:18:52 - INFO - __main__ - Step 260: {'lr': 6.475e-05, 'samples': 49920, 'steps': 259, 'loss/train': 3.9729881286621094} +11/06/2021 21:18:52 - INFO - __main__ - Step 261: {'lr': 6.500000000000001e-05, 'samples': 50112, 'steps': 260, 'loss/train': 5.403891563415527} +11/06/2021 21:18:52 - INFO - __main__ - Step 262: {'lr': 6.525e-05, 'samples': 50304, 'steps': 261, 'loss/train': 6.115725517272949} +11/06/2021 21:18:53 - INFO - __main__ - Step 263: {'lr': 6.55e-05, 'samples': 50496, 'steps': 262, 'loss/train': 6.0679426193237305} +11/06/2021 21:18:53 - INFO - __main__ - Step 264: {'lr': 6.575e-05, 'samples': 50688, 'steps': 263, 'loss/train': 5.964505195617676} +11/06/2021 21:18:54 - INFO - __main__ - Step 265: {'lr': 6.6e-05, 'samples': 50880, 'steps': 264, 'loss/train': 5.48927640914917} +11/06/2021 21:18:55 - INFO - __main__ - Step 266: {'lr': 6.625000000000001e-05, 'samples': 51072, 'steps': 265, 'loss/train': 6.112322807312012} +11/06/2021 21:18:55 - INFO - __main__ - Step 267: {'lr': 6.65e-05, 'samples': 51264, 'steps': 266, 'loss/train': 6.019900798797607} +11/06/2021 21:18:55 - INFO - __main__ - Step 268: {'lr': 6.675000000000001e-05, 'samples': 51456, 'steps': 267, 'loss/train': 6.1478657722473145} +11/06/2021 21:18:56 - INFO - __main__ - Step 269: {'lr': 6.7e-05, 'samples': 51648, 'steps': 268, 'loss/train': 5.52264404296875} +11/06/2021 21:18:57 - INFO - __main__ - Step 270: {'lr': 6.725000000000001e-05, 'samples': 51840, 'steps': 269, 'loss/train': 5.913082599639893} +11/06/2021 21:18:57 - INFO - __main__ - Step 271: {'lr': 6.75e-05, 'samples': 52032, 'steps': 270, 'loss/train': 5.843954086303711} +11/06/2021 21:18:57 - INFO - __main__ - Step 272: {'lr': 6.775000000000001e-05, 'samples': 52224, 'steps': 271, 'loss/train': 5.43068790435791} +11/06/2021 21:18:58 - INFO - __main__ - Step 273: {'lr': 6.800000000000001e-05, 'samples': 52416, 'steps': 272, 'loss/train': 5.731388568878174} +11/06/2021 21:18:58 - INFO - __main__ - Step 274: {'lr': 6.825e-05, 'samples': 52608, 'steps': 273, 'loss/train': 6.002760887145996} +11/06/2021 21:18:59 - INFO - __main__ - Step 275: {'lr': 6.850000000000001e-05, 'samples': 52800, 'steps': 274, 'loss/train': 5.909034729003906} +11/06/2021 21:18:59 - INFO - __main__ - Step 276: {'lr': 6.875e-05, 'samples': 52992, 'steps': 275, 'loss/train': 5.980253219604492} +11/06/2021 21:19:00 - INFO - __main__ - Step 277: {'lr': 6.900000000000001e-05, 'samples': 53184, 'steps': 276, 'loss/train': 5.36932373046875} +11/06/2021 21:19:00 - INFO - __main__ - Step 278: {'lr': 6.925e-05, 'samples': 53376, 'steps': 277, 'loss/train': 5.7302045822143555} +11/06/2021 21:19:00 - INFO - __main__ - Step 279: {'lr': 6.950000000000001e-05, 'samples': 53568, 'steps': 278, 'loss/train': 5.460746765136719} +11/06/2021 21:19:01 - INFO - __main__ - Step 280: {'lr': 6.975e-05, 'samples': 53760, 'steps': 279, 'loss/train': 5.948640823364258} +11/06/2021 21:19:02 - INFO - __main__ - Step 281: {'lr': 7.000000000000001e-05, 'samples': 53952, 'steps': 280, 'loss/train': 5.746571063995361} +11/06/2021 21:19:02 - INFO - __main__ - Step 282: {'lr': 7.025000000000001e-05, 'samples': 54144, 'steps': 281, 'loss/train': 6.098116874694824} +11/06/2021 21:19:03 - INFO - __main__ - Step 283: {'lr': 7.049999999999999e-05, 'samples': 54336, 'steps': 282, 'loss/train': 5.805056571960449} +11/06/2021 21:19:03 - INFO - __main__ - Step 284: {'lr': 7.075e-05, 'samples': 54528, 'steps': 283, 'loss/train': 5.200248718261719} +11/06/2021 21:19:04 - INFO - __main__ - Step 285: {'lr': 7.099999999999999e-05, 'samples': 54720, 'steps': 284, 'loss/train': 6.579744815826416} +11/06/2021 21:19:04 - INFO - __main__ - Step 286: {'lr': 7.125e-05, 'samples': 54912, 'steps': 285, 'loss/train': 5.594106197357178} +11/06/2021 21:19:05 - INFO - __main__ - Step 287: {'lr': 7.149999999999999e-05, 'samples': 55104, 'steps': 286, 'loss/train': 6.083644390106201} +11/06/2021 21:19:05 - INFO - __main__ - Step 288: {'lr': 7.175e-05, 'samples': 55296, 'steps': 287, 'loss/train': 5.514430999755859} +11/06/2021 21:19:05 - INFO - __main__ - Step 289: {'lr': 7.2e-05, 'samples': 55488, 'steps': 288, 'loss/train': 5.3459954261779785} +11/06/2021 21:19:06 - INFO - __main__ - Step 290: {'lr': 7.225e-05, 'samples': 55680, 'steps': 289, 'loss/train': 6.18521785736084} +11/06/2021 21:19:07 - INFO - __main__ - Step 291: {'lr': 7.25e-05, 'samples': 55872, 'steps': 290, 'loss/train': 6.124849319458008} +11/06/2021 21:19:07 - INFO - __main__ - Step 292: {'lr': 7.274999999999999e-05, 'samples': 56064, 'steps': 291, 'loss/train': 5.46663761138916} +11/06/2021 21:19:07 - INFO - __main__ - Step 293: {'lr': 7.3e-05, 'samples': 56256, 'steps': 292, 'loss/train': 5.0395188331604} +11/06/2021 21:19:08 - INFO - __main__ - Step 294: {'lr': 7.324999999999999e-05, 'samples': 56448, 'steps': 293, 'loss/train': 5.422224998474121} +11/06/2021 21:19:08 - INFO - __main__ - Step 295: {'lr': 7.35e-05, 'samples': 56640, 'steps': 294, 'loss/train': 5.153810024261475} +11/06/2021 21:19:09 - INFO - __main__ - Step 296: {'lr': 7.375e-05, 'samples': 56832, 'steps': 295, 'loss/train': 5.397673606872559} +11/06/2021 21:19:10 - INFO - __main__ - Step 297: {'lr': 7.4e-05, 'samples': 57024, 'steps': 296, 'loss/train': 5.323544979095459} +11/06/2021 21:19:10 - INFO - __main__ - Step 298: {'lr': 7.425e-05, 'samples': 57216, 'steps': 297, 'loss/train': 5.2873454093933105} +11/06/2021 21:19:10 - INFO - __main__ - Step 299: {'lr': 7.45e-05, 'samples': 57408, 'steps': 298, 'loss/train': 5.626234531402588} +11/06/2021 21:19:11 - INFO - __main__ - Step 300: {'lr': 7.475e-05, 'samples': 57600, 'steps': 299, 'loss/train': 5.648954391479492} +11/06/2021 21:19:12 - INFO - __main__ - Step 301: {'lr': 7.5e-05, 'samples': 57792, 'steps': 300, 'loss/train': 6.47790002822876} +11/06/2021 21:19:12 - INFO - __main__ - Step 302: {'lr': 7.525e-05, 'samples': 57984, 'steps': 301, 'loss/train': 5.377347469329834} +11/06/2021 21:19:12 - INFO - __main__ - Step 303: {'lr': 7.55e-05, 'samples': 58176, 'steps': 302, 'loss/train': 5.396330833435059} +11/06/2021 21:19:13 - INFO - __main__ - Step 304: {'lr': 7.575e-05, 'samples': 58368, 'steps': 303, 'loss/train': 6.444887161254883} +11/06/2021 21:19:13 - INFO - __main__ - Step 305: {'lr': 7.6e-05, 'samples': 58560, 'steps': 304, 'loss/train': 5.51333475112915} +11/06/2021 21:19:14 - INFO - __main__ - Step 306: {'lr': 7.625e-05, 'samples': 58752, 'steps': 305, 'loss/train': 5.4495744705200195} +11/06/2021 21:19:15 - INFO - __main__ - Step 307: {'lr': 7.65e-05, 'samples': 58944, 'steps': 306, 'loss/train': 5.420361518859863} +11/06/2021 21:19:15 - INFO - __main__ - Step 308: {'lr': 7.675e-05, 'samples': 59136, 'steps': 307, 'loss/train': 5.876494407653809} +11/06/2021 21:19:15 - INFO - __main__ - Step 309: {'lr': 7.7e-05, 'samples': 59328, 'steps': 308, 'loss/train': 5.0450520515441895} +11/06/2021 21:19:16 - INFO - __main__ - Step 310: {'lr': 7.725000000000001e-05, 'samples': 59520, 'steps': 309, 'loss/train': 5.425472736358643} +11/06/2021 21:19:17 - INFO - __main__ - Step 311: {'lr': 7.75e-05, 'samples': 59712, 'steps': 310, 'loss/train': 5.596251010894775} +11/06/2021 21:19:17 - INFO - __main__ - Step 312: {'lr': 7.775e-05, 'samples': 59904, 'steps': 311, 'loss/train': 5.2670392990112305} +11/06/2021 21:19:17 - INFO - __main__ - Step 313: {'lr': 7.8e-05, 'samples': 60096, 'steps': 312, 'loss/train': 7.779051780700684} +11/06/2021 21:19:18 - INFO - __main__ - Step 314: {'lr': 7.825e-05, 'samples': 60288, 'steps': 313, 'loss/train': 5.498117923736572} +11/06/2021 21:19:18 - INFO - __main__ - Step 315: {'lr': 7.85e-05, 'samples': 60480, 'steps': 314, 'loss/train': 5.533538341522217} +11/06/2021 21:19:19 - INFO - __main__ - Step 316: {'lr': 7.875e-05, 'samples': 60672, 'steps': 315, 'loss/train': 5.794958591461182} +11/06/2021 21:19:19 - INFO - __main__ - Step 317: {'lr': 7.9e-05, 'samples': 60864, 'steps': 316, 'loss/train': 5.267005443572998} +11/06/2021 21:19:20 - INFO - __main__ - Step 318: {'lr': 7.925e-05, 'samples': 61056, 'steps': 317, 'loss/train': 5.625141143798828} +11/06/2021 21:19:20 - INFO - __main__ - Step 319: {'lr': 7.950000000000001e-05, 'samples': 61248, 'steps': 318, 'loss/train': 5.229969024658203} +11/06/2021 21:19:21 - INFO - __main__ - Step 320: {'lr': 7.975e-05, 'samples': 61440, 'steps': 319, 'loss/train': 5.5839314460754395} +11/06/2021 21:19:21 - INFO - __main__ - Step 321: {'lr': 8e-05, 'samples': 61632, 'steps': 320, 'loss/train': 5.807913303375244} +11/06/2021 21:19:22 - INFO - __main__ - Step 322: {'lr': 8.025e-05, 'samples': 61824, 'steps': 321, 'loss/train': 5.966512203216553} +11/06/2021 21:19:22 - INFO - __main__ - Step 323: {'lr': 8.05e-05, 'samples': 62016, 'steps': 322, 'loss/train': 5.348308563232422} +11/06/2021 21:19:23 - INFO - __main__ - Step 324: {'lr': 8.075e-05, 'samples': 62208, 'steps': 323, 'loss/train': 5.878225326538086} +11/06/2021 21:19:23 - INFO - __main__ - Step 325: {'lr': 8.1e-05, 'samples': 62400, 'steps': 324, 'loss/train': 5.854434013366699} +11/06/2021 21:19:23 - INFO - __main__ - Step 326: {'lr': 8.125000000000001e-05, 'samples': 62592, 'steps': 325, 'loss/train': 5.428937911987305} +11/06/2021 21:19:24 - INFO - __main__ - Step 327: {'lr': 8.15e-05, 'samples': 62784, 'steps': 326, 'loss/train': 5.665132522583008} +11/06/2021 21:19:25 - INFO - __main__ - Step 328: {'lr': 8.175000000000001e-05, 'samples': 62976, 'steps': 327, 'loss/train': 5.691938400268555} +11/06/2021 21:19:25 - INFO - __main__ - Step 329: {'lr': 8.2e-05, 'samples': 63168, 'steps': 328, 'loss/train': 6.869819641113281} +11/06/2021 21:19:26 - INFO - __main__ - Step 330: {'lr': 8.225000000000001e-05, 'samples': 63360, 'steps': 329, 'loss/train': 4.917605876922607} +11/06/2021 21:19:26 - INFO - __main__ - Step 331: {'lr': 8.25e-05, 'samples': 63552, 'steps': 330, 'loss/train': 5.495372295379639} +11/06/2021 21:19:27 - INFO - __main__ - Step 332: {'lr': 8.275e-05, 'samples': 63744, 'steps': 331, 'loss/train': 5.180616855621338} +11/06/2021 21:19:27 - INFO - __main__ - Step 333: {'lr': 8.300000000000001e-05, 'samples': 63936, 'steps': 332, 'loss/train': 5.5182318687438965} +11/06/2021 21:19:28 - INFO - __main__ - Step 334: {'lr': 8.325e-05, 'samples': 64128, 'steps': 333, 'loss/train': 5.079967975616455} +11/06/2021 21:19:28 - INFO - __main__ - Step 335: {'lr': 8.350000000000001e-05, 'samples': 64320, 'steps': 334, 'loss/train': 5.6893181800842285} +11/06/2021 21:19:28 - INFO - __main__ - Step 336: {'lr': 8.375e-05, 'samples': 64512, 'steps': 335, 'loss/train': 5.519853115081787} +11/06/2021 21:19:29 - INFO - __main__ - Step 337: {'lr': 8.400000000000001e-05, 'samples': 64704, 'steps': 336, 'loss/train': 5.515233516693115} +11/06/2021 21:19:30 - INFO - __main__ - Step 338: {'lr': 8.425e-05, 'samples': 64896, 'steps': 337, 'loss/train': 4.627192974090576} +11/06/2021 21:19:30 - INFO - __main__ - Step 339: {'lr': 8.450000000000001e-05, 'samples': 65088, 'steps': 338, 'loss/train': 5.647910118103027} +11/06/2021 21:19:30 - INFO - __main__ - Step 340: {'lr': 8.475000000000001e-05, 'samples': 65280, 'steps': 339, 'loss/train': 5.477786540985107} +11/06/2021 21:19:31 - INFO - __main__ - Step 341: {'lr': 8.5e-05, 'samples': 65472, 'steps': 340, 'loss/train': 5.654776573181152} +11/06/2021 21:19:32 - INFO - __main__ - Step 342: {'lr': 8.525000000000001e-05, 'samples': 65664, 'steps': 341, 'loss/train': 5.568868637084961} +11/06/2021 21:19:32 - INFO - __main__ - Step 343: {'lr': 8.55e-05, 'samples': 65856, 'steps': 342, 'loss/train': 3.5874297618865967} +11/06/2021 21:19:33 - INFO - __main__ - Step 344: {'lr': 8.575000000000001e-05, 'samples': 66048, 'steps': 343, 'loss/train': 5.646244525909424} +11/06/2021 21:19:33 - INFO - __main__ - Step 345: {'lr': 8.599999999999999e-05, 'samples': 66240, 'steps': 344, 'loss/train': 5.599254131317139} +11/06/2021 21:19:33 - INFO - __main__ - Step 346: {'lr': 8.625e-05, 'samples': 66432, 'steps': 345, 'loss/train': 5.349778652191162} +11/06/2021 21:19:34 - INFO - __main__ - Step 347: {'lr': 8.65e-05, 'samples': 66624, 'steps': 346, 'loss/train': 5.612128257751465} +11/06/2021 21:19:35 - INFO - __main__ - Step 348: {'lr': 8.675e-05, 'samples': 66816, 'steps': 347, 'loss/train': 5.6107988357543945} +11/06/2021 21:19:35 - INFO - __main__ - Step 349: {'lr': 8.7e-05, 'samples': 67008, 'steps': 348, 'loss/train': 5.735456943511963} +11/06/2021 21:19:35 - INFO - __main__ - Step 350: {'lr': 8.724999999999999e-05, 'samples': 67200, 'steps': 349, 'loss/train': 5.3645172119140625} +11/06/2021 21:19:36 - INFO - __main__ - Step 351: {'lr': 8.75e-05, 'samples': 67392, 'steps': 350, 'loss/train': 5.467144966125488} +11/06/2021 21:19:36 - INFO - __main__ - Step 352: {'lr': 8.774999999999999e-05, 'samples': 67584, 'steps': 351, 'loss/train': 6.211921215057373} +11/06/2021 21:19:37 - INFO - __main__ - Step 353: {'lr': 8.8e-05, 'samples': 67776, 'steps': 352, 'loss/train': 5.452548980712891} +11/06/2021 21:19:37 - INFO - __main__ - Step 354: {'lr': 8.824999999999999e-05, 'samples': 67968, 'steps': 353, 'loss/train': 5.824997901916504} +11/06/2021 21:19:38 - INFO - __main__ - Step 355: {'lr': 8.85e-05, 'samples': 68160, 'steps': 354, 'loss/train': 5.646512985229492} +11/06/2021 21:19:38 - INFO - __main__ - Step 356: {'lr': 8.875e-05, 'samples': 68352, 'steps': 355, 'loss/train': 5.443009853363037} +11/06/2021 21:19:39 - INFO - __main__ - Step 357: {'lr': 8.9e-05, 'samples': 68544, 'steps': 356, 'loss/train': 5.597517490386963} +11/06/2021 21:19:40 - INFO - __main__ - Step 358: {'lr': 8.925e-05, 'samples': 68736, 'steps': 357, 'loss/train': 5.510553359985352} +11/06/2021 21:19:40 - INFO - __main__ - Step 359: {'lr': 8.95e-05, 'samples': 68928, 'steps': 358, 'loss/train': 5.271029949188232} +11/06/2021 21:19:40 - INFO - __main__ - Step 360: {'lr': 8.975e-05, 'samples': 69120, 'steps': 359, 'loss/train': 5.6077141761779785} +11/06/2021 21:19:41 - INFO - __main__ - Step 361: {'lr': 8.999999999999999e-05, 'samples': 69312, 'steps': 360, 'loss/train': 7.289037227630615} +11/06/2021 21:19:41 - INFO - __main__ - Step 362: {'lr': 9.025e-05, 'samples': 69504, 'steps': 361, 'loss/train': 5.1300740242004395} +11/06/2021 21:19:42 - INFO - __main__ - Step 363: {'lr': 9.05e-05, 'samples': 69696, 'steps': 362, 'loss/train': 5.349740982055664} +11/06/2021 21:19:42 - INFO - __main__ - Step 364: {'lr': 9.075e-05, 'samples': 69888, 'steps': 363, 'loss/train': 5.435561656951904} +11/06/2021 21:19:43 - INFO - __main__ - Step 365: {'lr': 9.1e-05, 'samples': 70080, 'steps': 364, 'loss/train': 5.4572978019714355} +11/06/2021 21:19:43 - INFO - __main__ - Step 366: {'lr': 9.125e-05, 'samples': 70272, 'steps': 365, 'loss/train': 5.351955890655518} +11/06/2021 21:19:43 - INFO - __main__ - Step 367: {'lr': 9.15e-05, 'samples': 70464, 'steps': 366, 'loss/train': 5.565761089324951} +11/06/2021 21:19:44 - INFO - __main__ - Step 368: {'lr': 9.175e-05, 'samples': 70656, 'steps': 367, 'loss/train': 5.959819316864014} +11/06/2021 21:19:45 - INFO - __main__ - Step 369: {'lr': 9.2e-05, 'samples': 70848, 'steps': 368, 'loss/train': 5.474288463592529} +11/06/2021 21:19:45 - INFO - __main__ - Step 370: {'lr': 9.225e-05, 'samples': 71040, 'steps': 369, 'loss/train': 5.607541561126709} +11/06/2021 21:19:46 - INFO - __main__ - Step 371: {'lr': 9.25e-05, 'samples': 71232, 'steps': 370, 'loss/train': 5.084637641906738} +11/06/2021 21:19:46 - INFO - __main__ - Step 372: {'lr': 9.275e-05, 'samples': 71424, 'steps': 371, 'loss/train': 4.969635009765625} +11/06/2021 21:19:46 - INFO - __main__ - Step 373: {'lr': 9.3e-05, 'samples': 71616, 'steps': 372, 'loss/train': 5.273648262023926} +11/06/2021 21:19:47 - INFO - __main__ - Step 374: {'lr': 9.325e-05, 'samples': 71808, 'steps': 373, 'loss/train': 5.385776042938232} +11/06/2021 21:19:48 - INFO - __main__ - Step 375: {'lr': 9.35e-05, 'samples': 72000, 'steps': 374, 'loss/train': 4.57074499130249} +11/06/2021 21:19:48 - INFO - __main__ - Step 376: {'lr': 9.375e-05, 'samples': 72192, 'steps': 375, 'loss/train': 5.399175643920898} +11/06/2021 21:19:48 - INFO - __main__ - Step 377: {'lr': 9.400000000000001e-05, 'samples': 72384, 'steps': 376, 'loss/train': 5.5180864334106445} +11/06/2021 21:19:49 - INFO - __main__ - Step 378: {'lr': 9.425e-05, 'samples': 72576, 'steps': 377, 'loss/train': 5.192264556884766} +11/06/2021 21:19:50 - INFO - __main__ - Step 379: {'lr': 9.45e-05, 'samples': 72768, 'steps': 378, 'loss/train': 5.126402854919434} +11/06/2021 21:19:50 - INFO - __main__ - Step 380: {'lr': 9.475e-05, 'samples': 72960, 'steps': 379, 'loss/train': 5.3973708152771} +11/06/2021 21:19:50 - INFO - __main__ - Step 381: {'lr': 9.5e-05, 'samples': 73152, 'steps': 380, 'loss/train': 5.583156585693359} +11/06/2021 21:19:51 - INFO - __main__ - Step 382: {'lr': 9.525e-05, 'samples': 73344, 'steps': 381, 'loss/train': 5.458894729614258} +11/06/2021 21:19:51 - INFO - __main__ - Step 383: {'lr': 9.55e-05, 'samples': 73536, 'steps': 382, 'loss/train': 5.020319938659668} +11/06/2021 21:19:52 - INFO - __main__ - Step 384: {'lr': 9.575000000000001e-05, 'samples': 73728, 'steps': 383, 'loss/train': 5.400721073150635} +11/06/2021 21:19:53 - INFO - __main__ - Step 385: {'lr': 9.6e-05, 'samples': 73920, 'steps': 384, 'loss/train': 5.1949381828308105} +11/06/2021 21:19:53 - INFO - __main__ - Step 386: {'lr': 9.625000000000001e-05, 'samples': 74112, 'steps': 385, 'loss/train': 5.291417121887207} +11/06/2021 21:19:53 - INFO - __main__ - Step 387: {'lr': 9.65e-05, 'samples': 74304, 'steps': 386, 'loss/train': 6.089571475982666} +11/06/2021 21:19:54 - INFO - __main__ - Step 388: {'lr': 9.675000000000001e-05, 'samples': 74496, 'steps': 387, 'loss/train': 5.51926326751709} +11/06/2021 21:19:55 - INFO - __main__ - Step 389: {'lr': 9.7e-05, 'samples': 74688, 'steps': 388, 'loss/train': 5.781015396118164} +11/06/2021 21:19:55 - INFO - __main__ - Step 390: {'lr': 9.725e-05, 'samples': 74880, 'steps': 389, 'loss/train': 4.908177852630615} +11/06/2021 21:19:55 - INFO - __main__ - Step 391: {'lr': 9.750000000000001e-05, 'samples': 75072, 'steps': 390, 'loss/train': 5.012897968292236} +11/06/2021 21:19:56 - INFO - __main__ - Step 392: {'lr': 9.775e-05, 'samples': 75264, 'steps': 391, 'loss/train': 5.399777889251709} +11/06/2021 21:19:56 - INFO - __main__ - Step 393: {'lr': 9.800000000000001e-05, 'samples': 75456, 'steps': 392, 'loss/train': 5.350080966949463} +11/06/2021 21:19:57 - INFO - __main__ - Step 394: {'lr': 9.825e-05, 'samples': 75648, 'steps': 393, 'loss/train': 5.737140655517578} +11/06/2021 21:19:57 - INFO - __main__ - Step 395: {'lr': 9.850000000000001e-05, 'samples': 75840, 'steps': 394, 'loss/train': 5.23768949508667} +11/06/2021 21:19:58 - INFO - __main__ - Step 396: {'lr': 9.875e-05, 'samples': 76032, 'steps': 395, 'loss/train': 5.202757358551025} +11/06/2021 21:19:58 - INFO - __main__ - Step 397: {'lr': 9.900000000000001e-05, 'samples': 76224, 'steps': 396, 'loss/train': 5.724830150604248} +11/06/2021 21:19:59 - INFO - __main__ - Step 398: {'lr': 9.925000000000001e-05, 'samples': 76416, 'steps': 397, 'loss/train': 6.981353282928467} +11/06/2021 21:19:59 - INFO - __main__ - Step 399: {'lr': 9.95e-05, 'samples': 76608, 'steps': 398, 'loss/train': 7.47460412979126} +11/06/2021 21:20:00 - INFO - __main__ - Step 400: {'lr': 9.975000000000001e-05, 'samples': 76800, 'steps': 399, 'loss/train': 5.741088390350342} +11/06/2021 21:20:00 - INFO - __main__ - Step 401: {'lr': 0.0001, 'samples': 76992, 'steps': 400, 'loss/train': 5.029991626739502} +11/06/2021 21:20:01 - INFO - __main__ - Step 402: {'lr': 0.00010025000000000001, 'samples': 77184, 'steps': 401, 'loss/train': 5.318662166595459} +11/06/2021 21:20:01 - INFO - __main__ - Step 403: {'lr': 0.0001005, 'samples': 77376, 'steps': 402, 'loss/train': 5.997198104858398} +11/06/2021 21:20:01 - INFO - __main__ - Step 404: {'lr': 0.00010075000000000001, 'samples': 77568, 'steps': 403, 'loss/train': 6.158583641052246} +11/06/2021 21:20:02 - INFO - __main__ - Step 405: {'lr': 0.000101, 'samples': 77760, 'steps': 404, 'loss/train': 5.336831569671631} +11/06/2021 21:20:03 - INFO - __main__ - Step 406: {'lr': 0.00010125000000000001, 'samples': 77952, 'steps': 405, 'loss/train': 5.227279186248779} +11/06/2021 21:20:03 - INFO - __main__ - Step 407: {'lr': 0.00010150000000000001, 'samples': 78144, 'steps': 406, 'loss/train': 5.527342319488525} +11/06/2021 21:20:03 - INFO - __main__ - Step 408: {'lr': 0.00010174999999999999, 'samples': 78336, 'steps': 407, 'loss/train': 5.73346471786499} +11/06/2021 21:20:04 - INFO - __main__ - Step 409: {'lr': 0.000102, 'samples': 78528, 'steps': 408, 'loss/train': 6.215020179748535} +11/06/2021 21:20:05 - INFO - __main__ - Step 410: {'lr': 0.00010224999999999999, 'samples': 78720, 'steps': 409, 'loss/train': 5.491655349731445} +11/06/2021 21:20:05 - INFO - __main__ - Step 411: {'lr': 0.0001025, 'samples': 78912, 'steps': 410, 'loss/train': 4.847282886505127} +11/06/2021 21:20:05 - INFO - __main__ - Step 412: {'lr': 0.00010274999999999999, 'samples': 79104, 'steps': 411, 'loss/train': 5.18861198425293} +11/06/2021 21:20:06 - INFO - __main__ - Step 413: {'lr': 0.000103, 'samples': 79296, 'steps': 412, 'loss/train': 5.54094934463501} +11/06/2021 21:20:06 - INFO - __main__ - Step 414: {'lr': 0.00010325, 'samples': 79488, 'steps': 413, 'loss/train': 5.201007843017578} +11/06/2021 21:20:07 - INFO - __main__ - Step 415: {'lr': 0.0001035, 'samples': 79680, 'steps': 414, 'loss/train': 5.937044143676758} +11/06/2021 21:20:08 - INFO - __main__ - Step 416: {'lr': 0.00010375, 'samples': 79872, 'steps': 415, 'loss/train': 5.265571117401123} +11/06/2021 21:20:08 - INFO - __main__ - Step 417: {'lr': 0.000104, 'samples': 80064, 'steps': 416, 'loss/train': 4.91490364074707} +11/06/2021 21:20:08 - INFO - __main__ - Step 418: {'lr': 0.00010425, 'samples': 80256, 'steps': 417, 'loss/train': 5.490600109100342} +11/06/2021 21:20:09 - INFO - __main__ - Step 419: {'lr': 0.00010449999999999999, 'samples': 80448, 'steps': 418, 'loss/train': 4.848526954650879} +11/06/2021 21:20:10 - INFO - __main__ - Step 420: {'lr': 0.00010475, 'samples': 80640, 'steps': 419, 'loss/train': 5.088794231414795} +11/06/2021 21:20:10 - INFO - __main__ - Step 421: {'lr': 0.000105, 'samples': 80832, 'steps': 420, 'loss/train': 5.438802719116211} +11/06/2021 21:20:10 - INFO - __main__ - Step 422: {'lr': 0.00010525, 'samples': 81024, 'steps': 421, 'loss/train': 5.321382522583008} +11/06/2021 21:20:11 - INFO - __main__ - Step 423: {'lr': 0.0001055, 'samples': 81216, 'steps': 422, 'loss/train': 5.291647434234619} +11/06/2021 21:20:11 - INFO - __main__ - Step 424: {'lr': 0.00010575, 'samples': 81408, 'steps': 423, 'loss/train': 4.753524303436279} +11/06/2021 21:20:11 - INFO - __main__ - Step 425: {'lr': 0.000106, 'samples': 81600, 'steps': 424, 'loss/train': 5.298032760620117} +11/06/2021 21:20:13 - INFO - __main__ - Step 426: {'lr': 0.00010625, 'samples': 81792, 'steps': 425, 'loss/train': 6.007701873779297} +11/06/2021 21:20:13 - INFO - __main__ - Step 427: {'lr': 0.0001065, 'samples': 81984, 'steps': 426, 'loss/train': 5.437173366546631} +11/06/2021 21:20:13 - INFO - __main__ - Step 428: {'lr': 0.00010675, 'samples': 82176, 'steps': 427, 'loss/train': 5.345945358276367} +11/06/2021 21:20:14 - INFO - __main__ - Step 429: {'lr': 0.000107, 'samples': 82368, 'steps': 428, 'loss/train': 5.066455841064453} +11/06/2021 21:20:14 - INFO - __main__ - Step 430: {'lr': 0.00010725, 'samples': 82560, 'steps': 429, 'loss/train': 3.3696258068084717} +11/06/2021 21:20:15 - INFO - __main__ - Step 431: {'lr': 0.0001075, 'samples': 82752, 'steps': 430, 'loss/train': 4.334190845489502} +11/06/2021 21:20:15 - INFO - __main__ - Step 432: {'lr': 0.00010775, 'samples': 82944, 'steps': 431, 'loss/train': 5.169923305511475} +11/06/2021 21:20:16 - INFO - __main__ - Step 433: {'lr': 0.000108, 'samples': 83136, 'steps': 432, 'loss/train': 5.3268537521362305} +11/06/2021 21:20:16 - INFO - __main__ - Step 434: {'lr': 0.00010825, 'samples': 83328, 'steps': 433, 'loss/train': 5.3919854164123535} +11/06/2021 21:20:16 - INFO - __main__ - Step 435: {'lr': 0.00010850000000000001, 'samples': 83520, 'steps': 434, 'loss/train': 5.3725810050964355} +11/06/2021 21:20:17 - INFO - __main__ - Step 436: {'lr': 0.00010875, 'samples': 83712, 'steps': 435, 'loss/train': 5.403895854949951} +11/06/2021 21:20:18 - INFO - __main__ - Step 437: {'lr': 0.000109, 'samples': 83904, 'steps': 436, 'loss/train': 5.205580711364746} +11/06/2021 21:20:18 - INFO - __main__ - Step 438: {'lr': 0.00010925, 'samples': 84096, 'steps': 437, 'loss/train': 5.33302640914917} +11/06/2021 21:20:18 - INFO - __main__ - Step 439: {'lr': 0.0001095, 'samples': 84288, 'steps': 438, 'loss/train': 5.41857385635376} +11/06/2021 21:20:19 - INFO - __main__ - Step 440: {'lr': 0.00010975, 'samples': 84480, 'steps': 439, 'loss/train': 5.0854315757751465} +11/06/2021 21:20:20 - INFO - __main__ - Step 441: {'lr': 0.00011, 'samples': 84672, 'steps': 440, 'loss/train': 4.953428745269775} +11/06/2021 21:20:21 - INFO - __main__ - Step 442: {'lr': 0.00011025, 'samples': 84864, 'steps': 441, 'loss/train': 5.355175495147705} +11/06/2021 21:20:21 - INFO - __main__ - Step 443: {'lr': 0.0001105, 'samples': 85056, 'steps': 442, 'loss/train': 5.322221279144287} +11/06/2021 21:20:21 - INFO - __main__ - Step 444: {'lr': 0.00011075000000000001, 'samples': 85248, 'steps': 443, 'loss/train': 5.694289207458496} +11/06/2021 21:20:22 - INFO - __main__ - Step 445: {'lr': 0.000111, 'samples': 85440, 'steps': 444, 'loss/train': 5.615618705749512} +11/06/2021 21:20:23 - INFO - __main__ - Step 446: {'lr': 0.00011125000000000001, 'samples': 85632, 'steps': 445, 'loss/train': 4.579447269439697} +11/06/2021 21:20:23 - INFO - __main__ - Step 447: {'lr': 0.0001115, 'samples': 85824, 'steps': 446, 'loss/train': 5.4635491371154785} +11/06/2021 21:20:23 - INFO - __main__ - Step 448: {'lr': 0.00011175, 'samples': 86016, 'steps': 447, 'loss/train': 5.6371636390686035} +11/06/2021 21:20:24 - INFO - __main__ - Step 449: {'lr': 0.000112, 'samples': 86208, 'steps': 448, 'loss/train': 5.192485332489014} +11/06/2021 21:20:24 - INFO - __main__ - Step 450: {'lr': 0.00011225, 'samples': 86400, 'steps': 449, 'loss/train': 5.126009464263916} +11/06/2021 21:20:25 - INFO - __main__ - Step 451: {'lr': 0.00011250000000000001, 'samples': 86592, 'steps': 450, 'loss/train': 4.955085754394531} +11/06/2021 21:20:25 - INFO - __main__ - Step 452: {'lr': 0.00011275, 'samples': 86784, 'steps': 451, 'loss/train': 4.919888973236084} +11/06/2021 21:20:26 - INFO - __main__ - Step 453: {'lr': 0.00011300000000000001, 'samples': 86976, 'steps': 452, 'loss/train': 5.37556266784668} +11/06/2021 21:20:26 - INFO - __main__ - Step 454: {'lr': 0.00011325, 'samples': 87168, 'steps': 453, 'loss/train': 5.237241744995117} +11/06/2021 21:20:26 - INFO - __main__ - Step 455: {'lr': 0.00011350000000000001, 'samples': 87360, 'steps': 454, 'loss/train': 4.927133083343506} +11/06/2021 21:20:27 - INFO - __main__ - Step 456: {'lr': 0.00011375, 'samples': 87552, 'steps': 455, 'loss/train': 5.2103400230407715} +11/06/2021 21:20:28 - INFO - __main__ - Step 457: {'lr': 0.000114, 'samples': 87744, 'steps': 456, 'loss/train': 5.820415496826172} +11/06/2021 21:20:28 - INFO - __main__ - Step 458: {'lr': 0.00011425000000000001, 'samples': 87936, 'steps': 457, 'loss/train': 3.8978383541107178} +11/06/2021 21:20:29 - INFO - __main__ - Step 459: {'lr': 0.0001145, 'samples': 88128, 'steps': 458, 'loss/train': 6.301289081573486} +11/06/2021 21:20:29 - INFO - __main__ - Step 460: {'lr': 0.00011475000000000001, 'samples': 88320, 'steps': 459, 'loss/train': 5.069262504577637} +11/06/2021 21:20:30 - INFO - __main__ - Step 461: {'lr': 0.000115, 'samples': 88512, 'steps': 460, 'loss/train': 5.043389320373535} +11/06/2021 21:20:30 - INFO - __main__ - Step 462: {'lr': 0.00011525000000000001, 'samples': 88704, 'steps': 461, 'loss/train': 5.780721664428711} +11/06/2021 21:20:31 - INFO - __main__ - Step 463: {'lr': 0.0001155, 'samples': 88896, 'steps': 462, 'loss/train': 4.882776737213135} +11/06/2021 21:20:31 - INFO - __main__ - Step 464: {'lr': 0.00011575000000000001, 'samples': 89088, 'steps': 463, 'loss/train': 4.844412326812744} +11/06/2021 21:20:31 - INFO - __main__ - Step 465: {'lr': 0.00011600000000000001, 'samples': 89280, 'steps': 464, 'loss/train': 5.012292385101318} +11/06/2021 21:20:32 - INFO - __main__ - Step 466: {'lr': 0.00011625, 'samples': 89472, 'steps': 465, 'loss/train': 5.141354084014893} +11/06/2021 21:20:33 - INFO - __main__ - Step 467: {'lr': 0.00011650000000000001, 'samples': 89664, 'steps': 466, 'loss/train': 5.3636956214904785} +11/06/2021 21:20:33 - INFO - __main__ - Step 468: {'lr': 0.00011675, 'samples': 89856, 'steps': 467, 'loss/train': 5.613701820373535} +11/06/2021 21:20:33 - INFO - __main__ - Step 469: {'lr': 0.00011700000000000001, 'samples': 90048, 'steps': 468, 'loss/train': 4.824275493621826} +11/06/2021 21:20:34 - INFO - __main__ - Step 470: {'lr': 0.00011724999999999999, 'samples': 90240, 'steps': 469, 'loss/train': 4.927989482879639} +11/06/2021 21:20:34 - INFO - __main__ - Step 471: {'lr': 0.0001175, 'samples': 90432, 'steps': 470, 'loss/train': 5.5396223068237305} +11/06/2021 21:20:35 - INFO - __main__ - Step 472: {'lr': 0.00011775, 'samples': 90624, 'steps': 471, 'loss/train': 5.157430648803711} +11/06/2021 21:20:36 - INFO - __main__ - Step 473: {'lr': 0.000118, 'samples': 90816, 'steps': 472, 'loss/train': 4.571201324462891} +11/06/2021 21:20:36 - INFO - __main__ - Step 474: {'lr': 0.00011825, 'samples': 91008, 'steps': 473, 'loss/train': 5.168905735015869} +11/06/2021 21:20:36 - INFO - __main__ - Step 475: {'lr': 0.0001185, 'samples': 91200, 'steps': 474, 'loss/train': 5.4914021492004395} +11/06/2021 21:20:37 - INFO - __main__ - Step 476: {'lr': 0.00011875, 'samples': 91392, 'steps': 475, 'loss/train': 5.1100382804870605} +11/06/2021 21:20:38 - INFO - __main__ - Step 477: {'lr': 0.00011899999999999999, 'samples': 91584, 'steps': 476, 'loss/train': 5.027097225189209} +11/06/2021 21:20:38 - INFO - __main__ - Step 478: {'lr': 0.00011925, 'samples': 91776, 'steps': 477, 'loss/train': 3.3699212074279785} +11/06/2021 21:20:38 - INFO - __main__ - Step 479: {'lr': 0.00011949999999999999, 'samples': 91968, 'steps': 478, 'loss/train': 5.552117824554443} +11/06/2021 21:20:39 - INFO - __main__ - Step 480: {'lr': 0.00011975, 'samples': 92160, 'steps': 479, 'loss/train': 5.236664295196533} +11/06/2021 21:20:39 - INFO - __main__ - Step 481: {'lr': 0.00012, 'samples': 92352, 'steps': 480, 'loss/train': 5.218561172485352} +11/06/2021 21:20:40 - INFO - __main__ - Step 482: {'lr': 0.00012025, 'samples': 92544, 'steps': 481, 'loss/train': 4.788586139678955} +11/06/2021 21:20:41 - INFO - __main__ - Step 483: {'lr': 0.0001205, 'samples': 92736, 'steps': 482, 'loss/train': 4.982636451721191} +11/06/2021 21:20:41 - INFO - __main__ - Step 484: {'lr': 0.00012075, 'samples': 92928, 'steps': 483, 'loss/train': 4.840455055236816} +11/06/2021 21:20:41 - INFO - __main__ - Step 485: {'lr': 0.000121, 'samples': 93120, 'steps': 484, 'loss/train': 5.3554840087890625} +11/06/2021 21:20:42 - INFO - __main__ - Step 486: {'lr': 0.00012124999999999999, 'samples': 93312, 'steps': 485, 'loss/train': 5.182967185974121} +11/06/2021 21:20:43 - INFO - __main__ - Step 487: {'lr': 0.0001215, 'samples': 93504, 'steps': 486, 'loss/train': 5.115420818328857} +11/06/2021 21:20:43 - INFO - __main__ - Step 488: {'lr': 0.00012175, 'samples': 93696, 'steps': 487, 'loss/train': 5.1655683517456055} +11/06/2021 21:20:43 - INFO - __main__ - Step 489: {'lr': 0.000122, 'samples': 93888, 'steps': 488, 'loss/train': 5.405882835388184} +11/06/2021 21:20:44 - INFO - __main__ - Step 490: {'lr': 0.00012225, 'samples': 94080, 'steps': 489, 'loss/train': 5.127898693084717} +11/06/2021 21:20:44 - INFO - __main__ - Step 491: {'lr': 0.0001225, 'samples': 94272, 'steps': 490, 'loss/train': 5.024046421051025} +11/06/2021 21:20:45 - INFO - __main__ - Step 492: {'lr': 0.00012275, 'samples': 94464, 'steps': 491, 'loss/train': 5.145169734954834} +11/06/2021 21:20:45 - INFO - __main__ - Step 493: {'lr': 0.000123, 'samples': 94656, 'steps': 492, 'loss/train': 4.954655170440674} +11/06/2021 21:20:46 - INFO - __main__ - Step 494: {'lr': 0.00012325000000000001, 'samples': 94848, 'steps': 493, 'loss/train': 5.174392223358154} +11/06/2021 21:20:46 - INFO - __main__ - Step 495: {'lr': 0.0001235, 'samples': 95040, 'steps': 494, 'loss/train': 4.580348014831543} +11/06/2021 21:20:47 - INFO - __main__ - Step 496: {'lr': 0.00012375, 'samples': 95232, 'steps': 495, 'loss/train': 4.821667194366455} +11/06/2021 21:20:47 - INFO - __main__ - Step 497: {'lr': 0.000124, 'samples': 95424, 'steps': 496, 'loss/train': 5.254716873168945} +11/06/2021 21:20:48 - INFO - __main__ - Step 498: {'lr': 0.00012425, 'samples': 95616, 'steps': 497, 'loss/train': 4.732685565948486} +11/06/2021 21:20:48 - INFO - __main__ - Step 499: {'lr': 0.0001245, 'samples': 95808, 'steps': 498, 'loss/train': 5.048670291900635} +11/06/2021 21:20:49 - INFO - __main__ - Step 500: {'lr': 0.00012475, 'samples': 96000, 'steps': 499, 'loss/train': 4.834158420562744} +11/06/2021 21:20:49 - INFO - __main__ - Step 501: {'lr': 0.000125, 'samples': 96192, 'steps': 500, 'loss/train': 5.50537109375} +11/06/2021 21:20:49 - INFO - __main__ - Step 502: {'lr': 0.00012525, 'samples': 96384, 'steps': 501, 'loss/train': 4.96640157699585} +11/06/2021 21:20:50 - INFO - __main__ - Step 503: {'lr': 0.00012550000000000001, 'samples': 96576, 'steps': 502, 'loss/train': 4.255295753479004} +11/06/2021 21:20:51 - INFO - __main__ - Step 504: {'lr': 0.00012575, 'samples': 96768, 'steps': 503, 'loss/train': 3.4102871417999268} +11/06/2021 21:20:51 - INFO - __main__ - Step 505: {'lr': 0.000126, 'samples': 96960, 'steps': 504, 'loss/train': 5.220231056213379} +11/06/2021 21:20:51 - INFO - __main__ - Step 506: {'lr': 0.00012625, 'samples': 97152, 'steps': 505, 'loss/train': 4.843728542327881} +11/06/2021 21:20:52 - INFO - __main__ - Step 507: {'lr': 0.0001265, 'samples': 97344, 'steps': 506, 'loss/train': 4.380231857299805} +11/06/2021 21:20:53 - INFO - __main__ - Step 508: {'lr': 0.00012675, 'samples': 97536, 'steps': 507, 'loss/train': 4.899729251861572} +11/06/2021 21:20:54 - INFO - __main__ - Step 509: {'lr': 0.000127, 'samples': 97728, 'steps': 508, 'loss/train': 4.977561950683594} +11/06/2021 21:20:54 - INFO - __main__ - Step 510: {'lr': 0.00012725, 'samples': 97920, 'steps': 509, 'loss/train': 5.346168518066406} +11/06/2021 21:20:54 - INFO - __main__ - Step 511: {'lr': 0.0001275, 'samples': 98112, 'steps': 510, 'loss/train': 4.873198509216309} +11/06/2021 21:20:55 - INFO - __main__ - Step 512: {'lr': 0.00012775000000000002, 'samples': 98304, 'steps': 511, 'loss/train': 5.125716686248779} +11/06/2021 21:20:56 - INFO - __main__ - Step 513: {'lr': 0.000128, 'samples': 98496, 'steps': 512, 'loss/train': 5.299740314483643} +11/06/2021 21:20:56 - INFO - __main__ - Step 514: {'lr': 0.00012825, 'samples': 98688, 'steps': 513, 'loss/train': 5.17880916595459} +11/06/2021 21:20:57 - INFO - __main__ - Step 515: {'lr': 0.0001285, 'samples': 98880, 'steps': 514, 'loss/train': 5.38531494140625} +11/06/2021 21:20:57 - INFO - __main__ - Step 516: {'lr': 0.00012875, 'samples': 99072, 'steps': 515, 'loss/train': 5.111538410186768} +11/06/2021 21:20:58 - INFO - __main__ - Step 517: {'lr': 0.00012900000000000002, 'samples': 99264, 'steps': 516, 'loss/train': 4.971146583557129} +11/06/2021 21:20:59 - INFO - __main__ - Step 518: {'lr': 0.00012925, 'samples': 99456, 'steps': 517, 'loss/train': 4.8264899253845215} +11/06/2021 21:20:59 - INFO - __main__ - Step 519: {'lr': 0.0001295, 'samples': 99648, 'steps': 518, 'loss/train': 4.728095054626465} +11/06/2021 21:20:59 - INFO - __main__ - Step 520: {'lr': 0.00012975, 'samples': 99840, 'steps': 519, 'loss/train': 4.82402229309082} +11/06/2021 21:21:00 - INFO - __main__ - Step 521: {'lr': 0.00013000000000000002, 'samples': 100032, 'steps': 520, 'loss/train': 4.82277774810791} +11/06/2021 21:21:00 - INFO - __main__ - Step 522: {'lr': 0.00013025, 'samples': 100224, 'steps': 521, 'loss/train': 4.736476898193359} +11/06/2021 21:21:01 - INFO - __main__ - Step 523: {'lr': 0.0001305, 'samples': 100416, 'steps': 522, 'loss/train': 5.3957390785217285} +11/06/2021 21:21:02 - INFO - __main__ - Step 524: {'lr': 0.00013075, 'samples': 100608, 'steps': 523, 'loss/train': 4.804849624633789} +11/06/2021 21:21:02 - INFO - __main__ - Step 525: {'lr': 0.000131, 'samples': 100800, 'steps': 524, 'loss/train': 5.213521957397461} +11/06/2021 21:21:02 - INFO - __main__ - Step 526: {'lr': 0.00013125000000000002, 'samples': 100992, 'steps': 525, 'loss/train': 4.800134181976318} +11/06/2021 21:21:03 - INFO - __main__ - Step 527: {'lr': 0.0001315, 'samples': 101184, 'steps': 526, 'loss/train': 5.979576587677002} +11/06/2021 21:21:04 - INFO - __main__ - Step 528: {'lr': 0.00013175, 'samples': 101376, 'steps': 527, 'loss/train': 4.6841630935668945} +11/06/2021 21:21:04 - INFO - __main__ - Step 529: {'lr': 0.000132, 'samples': 101568, 'steps': 528, 'loss/train': 5.14123010635376} +11/06/2021 21:21:04 - INFO - __main__ - Step 530: {'lr': 0.00013225000000000002, 'samples': 101760, 'steps': 529, 'loss/train': 4.850307941436768} +11/06/2021 21:21:05 - INFO - __main__ - Step 531: {'lr': 0.00013250000000000002, 'samples': 101952, 'steps': 530, 'loss/train': 4.945707321166992} +11/06/2021 21:21:05 - INFO - __main__ - Step 532: {'lr': 0.00013275, 'samples': 102144, 'steps': 531, 'loss/train': 5.073093891143799} +11/06/2021 21:21:06 - INFO - __main__ - Step 533: {'lr': 0.000133, 'samples': 102336, 'steps': 532, 'loss/train': 4.880060195922852} +11/06/2021 21:21:07 - INFO - __main__ - Step 534: {'lr': 0.00013325, 'samples': 102528, 'steps': 533, 'loss/train': 5.960422039031982} +11/06/2021 21:21:07 - INFO - __main__ - Step 535: {'lr': 0.00013350000000000002, 'samples': 102720, 'steps': 534, 'loss/train': 4.578385829925537} +11/06/2021 21:21:07 - INFO - __main__ - Step 536: {'lr': 0.00013375, 'samples': 102912, 'steps': 535, 'loss/train': 5.22959566116333} +11/06/2021 21:21:08 - INFO - __main__ - Step 537: {'lr': 0.000134, 'samples': 103104, 'steps': 536, 'loss/train': 5.195213317871094} +11/06/2021 21:21:08 - INFO - __main__ - Step 538: {'lr': 0.00013425, 'samples': 103296, 'steps': 537, 'loss/train': 5.1764912605285645} +11/06/2021 21:21:09 - INFO - __main__ - Step 539: {'lr': 0.00013450000000000002, 'samples': 103488, 'steps': 538, 'loss/train': 4.329580783843994} +11/06/2021 21:21:09 - INFO - __main__ - Step 540: {'lr': 0.00013475000000000002, 'samples': 103680, 'steps': 539, 'loss/train': 5.327682971954346} +11/06/2021 21:21:10 - INFO - __main__ - Step 541: {'lr': 0.000135, 'samples': 103872, 'steps': 540, 'loss/train': 5.050226211547852} +11/06/2021 21:21:10 - INFO - __main__ - Step 542: {'lr': 0.00013525, 'samples': 104064, 'steps': 541, 'loss/train': 6.563281059265137} +11/06/2021 21:21:10 - INFO - __main__ - Step 543: {'lr': 0.00013550000000000001, 'samples': 104256, 'steps': 542, 'loss/train': 5.260067462921143} +11/06/2021 21:21:12 - INFO - __main__ - Step 544: {'lr': 0.00013575000000000002, 'samples': 104448, 'steps': 543, 'loss/train': 5.054920196533203} +11/06/2021 21:21:12 - INFO - __main__ - Step 545: {'lr': 0.00013600000000000003, 'samples': 104640, 'steps': 544, 'loss/train': 4.304242134094238} +11/06/2021 21:21:12 - INFO - __main__ - Step 546: {'lr': 0.00013625, 'samples': 104832, 'steps': 545, 'loss/train': 5.143182277679443} +11/06/2021 21:21:13 - INFO - __main__ - Step 547: {'lr': 0.0001365, 'samples': 105024, 'steps': 546, 'loss/train': 5.063644886016846} +11/06/2021 21:21:13 - INFO - __main__ - Step 548: {'lr': 0.00013675000000000002, 'samples': 105216, 'steps': 547, 'loss/train': 4.523825168609619} +11/06/2021 21:21:14 - INFO - __main__ - Step 549: {'lr': 0.00013700000000000002, 'samples': 105408, 'steps': 548, 'loss/train': 5.415563583374023} +11/06/2021 21:21:14 - INFO - __main__ - Step 550: {'lr': 0.00013725, 'samples': 105600, 'steps': 549, 'loss/train': 5.242093086242676} +11/06/2021 21:21:15 - INFO - __main__ - Step 551: {'lr': 0.0001375, 'samples': 105792, 'steps': 550, 'loss/train': 5.3217949867248535} +11/06/2021 21:21:15 - INFO - __main__ - Step 552: {'lr': 0.00013775000000000001, 'samples': 105984, 'steps': 551, 'loss/train': 4.965686798095703} +11/06/2021 21:21:15 - INFO - __main__ - Step 553: {'lr': 0.00013800000000000002, 'samples': 106176, 'steps': 552, 'loss/train': 4.69637393951416} +11/06/2021 21:21:16 - INFO - __main__ - Step 554: {'lr': 0.00013825000000000003, 'samples': 106368, 'steps': 553, 'loss/train': 5.67413854598999} +11/06/2021 21:21:17 - INFO - __main__ - Step 555: {'lr': 0.0001385, 'samples': 106560, 'steps': 554, 'loss/train': 1.4391024112701416} +11/06/2021 21:21:17 - INFO - __main__ - Step 556: {'lr': 0.00013875, 'samples': 106752, 'steps': 555, 'loss/train': 4.693598747253418} +11/06/2021 21:21:18 - INFO - __main__ - Step 557: {'lr': 0.00013900000000000002, 'samples': 106944, 'steps': 556, 'loss/train': 4.811655521392822} +11/06/2021 21:21:18 - INFO - __main__ - Step 558: {'lr': 0.00013925000000000002, 'samples': 107136, 'steps': 557, 'loss/train': 5.708633899688721} +11/06/2021 21:21:18 - INFO - __main__ - Step 559: {'lr': 0.0001395, 'samples': 107328, 'steps': 558, 'loss/train': 5.34543514251709} +11/06/2021 21:21:19 - INFO - __main__ - Step 560: {'lr': 0.00013975, 'samples': 107520, 'steps': 559, 'loss/train': 4.994585990905762} +11/06/2021 21:21:20 - INFO - __main__ - Step 561: {'lr': 0.00014000000000000001, 'samples': 107712, 'steps': 560, 'loss/train': 4.977428913116455} +11/06/2021 21:21:20 - INFO - __main__ - Step 562: {'lr': 0.00014025000000000002, 'samples': 107904, 'steps': 561, 'loss/train': 5.134328365325928} +11/06/2021 21:21:20 - INFO - __main__ - Step 563: {'lr': 0.00014050000000000003, 'samples': 108096, 'steps': 562, 'loss/train': 5.075902462005615} +11/06/2021 21:21:21 - INFO - __main__ - Step 564: {'lr': 0.00014074999999999998, 'samples': 108288, 'steps': 563, 'loss/train': 4.605697154998779} +11/06/2021 21:21:22 - INFO - __main__ - Step 565: {'lr': 0.00014099999999999998, 'samples': 108480, 'steps': 564, 'loss/train': 4.873136520385742} +11/06/2021 21:21:22 - INFO - __main__ - Step 566: {'lr': 0.00014125, 'samples': 108672, 'steps': 565, 'loss/train': 4.94666862487793} +11/06/2021 21:21:22 - INFO - __main__ - Step 567: {'lr': 0.0001415, 'samples': 108864, 'steps': 566, 'loss/train': 4.661070823669434} +11/06/2021 21:21:23 - INFO - __main__ - Step 568: {'lr': 0.00014175, 'samples': 109056, 'steps': 567, 'loss/train': 5.004296779632568} +11/06/2021 21:21:23 - INFO - __main__ - Step 569: {'lr': 0.00014199999999999998, 'samples': 109248, 'steps': 568, 'loss/train': 4.945058345794678} +11/06/2021 21:21:24 - INFO - __main__ - Step 570: {'lr': 0.00014225, 'samples': 109440, 'steps': 569, 'loss/train': 4.626468658447266} +11/06/2021 21:21:25 - INFO - __main__ - Step 571: {'lr': 0.0001425, 'samples': 109632, 'steps': 570, 'loss/train': 4.994494915008545} +11/06/2021 21:21:25 - INFO - __main__ - Step 572: {'lr': 0.00014275, 'samples': 109824, 'steps': 571, 'loss/train': 5.284569263458252} +11/06/2021 21:21:26 - INFO - __main__ - Step 573: {'lr': 0.00014299999999999998, 'samples': 110016, 'steps': 572, 'loss/train': 5.315004348754883} +11/06/2021 21:21:26 - INFO - __main__ - Step 574: {'lr': 0.00014324999999999999, 'samples': 110208, 'steps': 573, 'loss/train': 4.810165882110596} +11/06/2021 21:21:27 - INFO - __main__ - Step 575: {'lr': 0.0001435, 'samples': 110400, 'steps': 574, 'loss/train': 5.227445125579834} +11/06/2021 21:21:27 - INFO - __main__ - Step 576: {'lr': 0.00014375, 'samples': 110592, 'steps': 575, 'loss/train': 5.34274435043335} +11/06/2021 21:21:28 - INFO - __main__ - Step 577: {'lr': 0.000144, 'samples': 110784, 'steps': 576, 'loss/train': 5.176715850830078} +11/06/2021 21:21:28 - INFO - __main__ - Step 578: {'lr': 0.00014424999999999998, 'samples': 110976, 'steps': 577, 'loss/train': 4.281363487243652} +11/06/2021 21:21:28 - INFO - __main__ - Step 579: {'lr': 0.0001445, 'samples': 111168, 'steps': 578, 'loss/train': 5.460202217102051} +11/06/2021 21:21:29 - INFO - __main__ - Step 580: {'lr': 0.00014475, 'samples': 111360, 'steps': 579, 'loss/train': 5.397484302520752} +11/06/2021 21:21:30 - INFO - __main__ - Step 581: {'lr': 0.000145, 'samples': 111552, 'steps': 580, 'loss/train': 4.4818291664123535} +11/06/2021 21:21:30 - INFO - __main__ - Step 582: {'lr': 0.00014524999999999998, 'samples': 111744, 'steps': 581, 'loss/train': 4.609002590179443} +11/06/2021 21:21:31 - INFO - __main__ - Step 583: {'lr': 0.00014549999999999999, 'samples': 111936, 'steps': 582, 'loss/train': 5.447309970855713} +11/06/2021 21:21:31 - INFO - __main__ - Step 584: {'lr': 0.00014575, 'samples': 112128, 'steps': 583, 'loss/train': 5.413631439208984} +11/06/2021 21:21:32 - INFO - __main__ - Step 585: {'lr': 0.000146, 'samples': 112320, 'steps': 584, 'loss/train': 6.304897308349609} +11/06/2021 21:21:32 - INFO - __main__ - Step 586: {'lr': 0.00014625, 'samples': 112512, 'steps': 585, 'loss/train': 3.9225189685821533} +11/06/2021 21:21:33 - INFO - __main__ - Step 587: {'lr': 0.00014649999999999998, 'samples': 112704, 'steps': 586, 'loss/train': 4.575343132019043} +11/06/2021 21:21:33 - INFO - __main__ - Step 588: {'lr': 0.00014675, 'samples': 112896, 'steps': 587, 'loss/train': 4.97996711730957} +11/06/2021 21:21:34 - INFO - __main__ - Step 589: {'lr': 0.000147, 'samples': 113088, 'steps': 588, 'loss/train': 5.520531177520752} +11/06/2021 21:21:35 - INFO - __main__ - Step 590: {'lr': 0.00014725, 'samples': 113280, 'steps': 589, 'loss/train': 4.435773849487305} +11/06/2021 21:21:35 - INFO - __main__ - Step 591: {'lr': 0.0001475, 'samples': 113472, 'steps': 590, 'loss/train': 5.016930103302002} +11/06/2021 21:21:35 - INFO - __main__ - Step 592: {'lr': 0.00014774999999999999, 'samples': 113664, 'steps': 591, 'loss/train': 4.882648468017578} +11/06/2021 21:21:36 - INFO - __main__ - Step 593: {'lr': 0.000148, 'samples': 113856, 'steps': 592, 'loss/train': 6.573506832122803} +11/06/2021 21:21:36 - INFO - __main__ - Step 594: {'lr': 0.00014825, 'samples': 114048, 'steps': 593, 'loss/train': 4.22829532623291} +11/06/2021 21:21:36 - INFO - __main__ - Step 595: {'lr': 0.0001485, 'samples': 114240, 'steps': 594, 'loss/train': 4.915690898895264} +11/06/2021 21:21:37 - INFO - __main__ - Step 596: {'lr': 0.00014874999999999998, 'samples': 114432, 'steps': 595, 'loss/train': 4.756763458251953} +11/06/2021 21:21:38 - INFO - __main__ - Step 597: {'lr': 0.000149, 'samples': 114624, 'steps': 596, 'loss/train': 4.910470485687256} +11/06/2021 21:21:38 - INFO - __main__ - Step 598: {'lr': 0.00014925, 'samples': 114816, 'steps': 597, 'loss/train': 4.912417411804199} +11/06/2021 21:21:38 - INFO - __main__ - Step 599: {'lr': 0.0001495, 'samples': 115008, 'steps': 598, 'loss/train': 4.568467140197754} +11/06/2021 21:21:39 - INFO - __main__ - Step 600: {'lr': 0.00014975, 'samples': 115200, 'steps': 599, 'loss/train': 4.727468967437744} +11/06/2021 21:21:40 - INFO - __main__ - Step 601: {'lr': 0.00015, 'samples': 115392, 'steps': 600, 'loss/train': 4.731727123260498} +11/06/2021 21:21:40 - INFO - __main__ - Step 602: {'lr': 0.00015025, 'samples': 115584, 'steps': 601, 'loss/train': 5.941672325134277} +11/06/2021 21:21:41 - INFO - __main__ - Step 603: {'lr': 0.0001505, 'samples': 115776, 'steps': 602, 'loss/train': 4.752991676330566} +11/06/2021 21:21:41 - INFO - __main__ - Step 604: {'lr': 0.00015075, 'samples': 115968, 'steps': 603, 'loss/train': 4.749768257141113} +11/06/2021 21:21:41 - INFO - __main__ - Step 605: {'lr': 0.000151, 'samples': 116160, 'steps': 604, 'loss/train': 4.868316650390625} +11/06/2021 21:21:43 - INFO - __main__ - Step 606: {'lr': 0.00015125, 'samples': 116352, 'steps': 605, 'loss/train': 4.696784973144531} +11/06/2021 21:21:43 - INFO - __main__ - Step 607: {'lr': 0.0001515, 'samples': 116544, 'steps': 606, 'loss/train': 5.38928747177124} +11/06/2021 21:21:43 - INFO - __main__ - Step 608: {'lr': 0.00015175, 'samples': 116736, 'steps': 607, 'loss/train': 4.822604179382324} +11/06/2021 21:21:44 - INFO - __main__ - Step 609: {'lr': 0.000152, 'samples': 116928, 'steps': 608, 'loss/train': 4.739031791687012} +11/06/2021 21:21:44 - INFO - __main__ - Step 610: {'lr': 0.00015225, 'samples': 117120, 'steps': 609, 'loss/train': 4.78218412399292} +11/06/2021 21:21:44 - INFO - __main__ - Step 611: {'lr': 0.0001525, 'samples': 117312, 'steps': 610, 'loss/train': 5.469936370849609} +11/06/2021 21:21:46 - INFO - __main__ - Step 612: {'lr': 0.00015275, 'samples': 117504, 'steps': 611, 'loss/train': 5.018012523651123} +11/06/2021 21:21:46 - INFO - __main__ - Step 613: {'lr': 0.000153, 'samples': 117696, 'steps': 612, 'loss/train': 4.723076343536377} +11/06/2021 21:21:46 - INFO - __main__ - Step 614: {'lr': 0.00015325, 'samples': 117888, 'steps': 613, 'loss/train': 4.444612503051758} +11/06/2021 21:21:47 - INFO - __main__ - Step 615: {'lr': 0.0001535, 'samples': 118080, 'steps': 614, 'loss/train': 5.002647876739502} +11/06/2021 21:21:47 - INFO - __main__ - Step 616: {'lr': 0.00015375, 'samples': 118272, 'steps': 615, 'loss/train': 5.234433174133301} +11/06/2021 21:21:48 - INFO - __main__ - Step 617: {'lr': 0.000154, 'samples': 118464, 'steps': 616, 'loss/train': 5.180642604827881} +11/06/2021 21:21:48 - INFO - __main__ - Step 618: {'lr': 0.00015425, 'samples': 118656, 'steps': 617, 'loss/train': 4.186741828918457} +11/06/2021 21:21:49 - INFO - __main__ - Step 619: {'lr': 0.00015450000000000001, 'samples': 118848, 'steps': 618, 'loss/train': 4.601840019226074} +11/06/2021 21:21:49 - INFO - __main__ - Step 620: {'lr': 0.00015475, 'samples': 119040, 'steps': 619, 'loss/train': 5.070303440093994} +11/06/2021 21:21:50 - INFO - __main__ - Step 621: {'lr': 0.000155, 'samples': 119232, 'steps': 620, 'loss/train': 4.981260776519775} +11/06/2021 21:21:50 - INFO - __main__ - Step 622: {'lr': 0.00015525, 'samples': 119424, 'steps': 621, 'loss/train': 4.912421703338623} +11/06/2021 21:21:51 - INFO - __main__ - Step 623: {'lr': 0.0001555, 'samples': 119616, 'steps': 622, 'loss/train': 4.604945182800293} +11/06/2021 21:21:51 - INFO - __main__ - Step 624: {'lr': 0.00015575, 'samples': 119808, 'steps': 623, 'loss/train': 4.606297969818115} +11/06/2021 21:21:52 - INFO - __main__ - Step 625: {'lr': 0.000156, 'samples': 120000, 'steps': 624, 'loss/train': 4.950876235961914} +11/06/2021 21:21:52 - INFO - __main__ - Step 626: {'lr': 0.00015625, 'samples': 120192, 'steps': 625, 'loss/train': 4.56068229675293} +11/06/2021 21:21:52 - INFO - __main__ - Step 627: {'lr': 0.0001565, 'samples': 120384, 'steps': 626, 'loss/train': 4.22480583190918} +11/06/2021 21:21:53 - INFO - __main__ - Step 628: {'lr': 0.00015675000000000002, 'samples': 120576, 'steps': 627, 'loss/train': 5.061352729797363} +11/06/2021 21:21:54 - INFO - __main__ - Step 629: {'lr': 0.000157, 'samples': 120768, 'steps': 628, 'loss/train': 4.828984260559082} +11/06/2021 21:21:54 - INFO - __main__ - Step 630: {'lr': 0.00015725, 'samples': 120960, 'steps': 629, 'loss/train': 4.675282955169678} +11/06/2021 21:21:55 - INFO - __main__ - Step 631: {'lr': 0.0001575, 'samples': 121152, 'steps': 630, 'loss/train': 4.3496575355529785} +11/06/2021 21:21:55 - INFO - __main__ - Step 632: {'lr': 0.00015775, 'samples': 121344, 'steps': 631, 'loss/train': 4.719287872314453} +11/06/2021 21:21:56 - INFO - __main__ - Step 633: {'lr': 0.000158, 'samples': 121536, 'steps': 632, 'loss/train': 4.833708763122559} +11/06/2021 21:21:56 - INFO - __main__ - Step 634: {'lr': 0.00015825, 'samples': 121728, 'steps': 633, 'loss/train': 4.082372665405273} +11/06/2021 21:21:57 - INFO - __main__ - Step 635: {'lr': 0.0001585, 'samples': 121920, 'steps': 634, 'loss/train': 4.89099645614624} +11/06/2021 21:21:57 - INFO - __main__ - Step 636: {'lr': 0.00015875, 'samples': 122112, 'steps': 635, 'loss/train': 5.596816062927246} +11/06/2021 21:21:57 - INFO - __main__ - Step 637: {'lr': 0.00015900000000000002, 'samples': 122304, 'steps': 636, 'loss/train': 4.681394100189209} +11/06/2021 21:21:58 - INFO - __main__ - Step 638: {'lr': 0.00015925, 'samples': 122496, 'steps': 637, 'loss/train': 4.834127426147461} +11/06/2021 21:21:59 - INFO - __main__ - Step 639: {'lr': 0.0001595, 'samples': 122688, 'steps': 638, 'loss/train': 5.277633190155029} +11/06/2021 21:21:59 - INFO - __main__ - Step 640: {'lr': 0.00015975, 'samples': 122880, 'steps': 639, 'loss/train': 5.002859115600586} +11/06/2021 21:21:59 - INFO - __main__ - Step 641: {'lr': 0.00016, 'samples': 123072, 'steps': 640, 'loss/train': 5.2396440505981445} +11/06/2021 21:22:00 - INFO - __main__ - Step 642: {'lr': 0.00016025000000000002, 'samples': 123264, 'steps': 641, 'loss/train': 5.183033466339111} +11/06/2021 21:22:01 - INFO - __main__ - Step 643: {'lr': 0.0001605, 'samples': 123456, 'steps': 642, 'loss/train': 4.6580305099487305} +11/06/2021 21:22:01 - INFO - __main__ - Step 644: {'lr': 0.00016075, 'samples': 123648, 'steps': 643, 'loss/train': 4.906527519226074} +11/06/2021 21:22:02 - INFO - __main__ - Step 645: {'lr': 0.000161, 'samples': 123840, 'steps': 644, 'loss/train': 4.350686073303223} +11/06/2021 21:22:02 - INFO - __main__ - Step 646: {'lr': 0.00016125000000000002, 'samples': 124032, 'steps': 645, 'loss/train': 4.576035499572754} +11/06/2021 21:22:02 - INFO - __main__ - Step 647: {'lr': 0.0001615, 'samples': 124224, 'steps': 646, 'loss/train': 4.445610046386719} +11/06/2021 21:22:03 - INFO - __main__ - Step 648: {'lr': 0.00016175, 'samples': 124416, 'steps': 647, 'loss/train': 4.549352645874023} +11/06/2021 21:22:04 - INFO - __main__ - Step 649: {'lr': 0.000162, 'samples': 124608, 'steps': 648, 'loss/train': 4.443591117858887} +11/06/2021 21:22:04 - INFO - __main__ - Step 650: {'lr': 0.00016225000000000001, 'samples': 124800, 'steps': 649, 'loss/train': 4.2263288497924805} +11/06/2021 21:22:04 - INFO - __main__ - Step 651: {'lr': 0.00016250000000000002, 'samples': 124992, 'steps': 650, 'loss/train': 4.449684143066406} +11/06/2021 21:22:05 - INFO - __main__ - Step 652: {'lr': 0.00016275, 'samples': 125184, 'steps': 651, 'loss/train': 5.221400737762451} +11/06/2021 21:22:06 - INFO - __main__ - Step 653: {'lr': 0.000163, 'samples': 125376, 'steps': 652, 'loss/train': 5.1638994216918945} +11/06/2021 21:22:06 - INFO - __main__ - Step 654: {'lr': 0.00016325, 'samples': 125568, 'steps': 653, 'loss/train': 4.728190898895264} +11/06/2021 21:22:06 - INFO - __main__ - Step 655: {'lr': 0.00016350000000000002, 'samples': 125760, 'steps': 654, 'loss/train': 4.6709394454956055} +11/06/2021 21:22:07 - INFO - __main__ - Step 656: {'lr': 0.00016375000000000002, 'samples': 125952, 'steps': 655, 'loss/train': 4.627468109130859} +11/06/2021 21:22:07 - INFO - __main__ - Step 657: {'lr': 0.000164, 'samples': 126144, 'steps': 656, 'loss/train': 4.362966060638428} +11/06/2021 21:22:08 - INFO - __main__ - Step 658: {'lr': 0.00016425, 'samples': 126336, 'steps': 657, 'loss/train': 5.120889663696289} +11/06/2021 21:22:08 - INFO - __main__ - Step 659: {'lr': 0.00016450000000000001, 'samples': 126528, 'steps': 658, 'loss/train': 4.917827129364014} +11/06/2021 21:22:09 - INFO - __main__ - Step 660: {'lr': 0.00016475000000000002, 'samples': 126720, 'steps': 659, 'loss/train': 4.704123020172119} +11/06/2021 21:22:09 - INFO - __main__ - Step 661: {'lr': 0.000165, 'samples': 126912, 'steps': 660, 'loss/train': 4.710036277770996} +11/06/2021 21:22:10 - INFO - __main__ - Step 662: {'lr': 0.00016525, 'samples': 127104, 'steps': 661, 'loss/train': 4.979597091674805} +11/06/2021 21:22:10 - INFO - __main__ - Step 663: {'lr': 0.0001655, 'samples': 127296, 'steps': 662, 'loss/train': 4.606518268585205} +11/06/2021 21:22:11 - INFO - __main__ - Step 664: {'lr': 0.00016575000000000002, 'samples': 127488, 'steps': 663, 'loss/train': 4.490879058837891} +11/06/2021 21:22:11 - INFO - __main__ - Step 665: {'lr': 0.00016600000000000002, 'samples': 127680, 'steps': 664, 'loss/train': 4.3809075355529785} +11/06/2021 21:22:12 - INFO - __main__ - Step 666: {'lr': 0.00016625, 'samples': 127872, 'steps': 665, 'loss/train': 4.735256195068359} +11/06/2021 21:22:12 - INFO - __main__ - Step 667: {'lr': 0.0001665, 'samples': 128064, 'steps': 666, 'loss/train': 4.7257890701293945} +11/06/2021 21:22:12 - INFO - __main__ - Step 668: {'lr': 0.00016675000000000001, 'samples': 128256, 'steps': 667, 'loss/train': 4.959212303161621} +11/06/2021 21:22:13 - INFO - __main__ - Step 669: {'lr': 0.00016700000000000002, 'samples': 128448, 'steps': 668, 'loss/train': 4.34332275390625} +11/06/2021 21:22:14 - INFO - __main__ - Step 670: {'lr': 0.00016725000000000003, 'samples': 128640, 'steps': 669, 'loss/train': 4.633439064025879} +11/06/2021 21:22:14 - INFO - __main__ - Step 671: {'lr': 0.0001675, 'samples': 128832, 'steps': 670, 'loss/train': 4.631658554077148} +11/06/2021 21:22:15 - INFO - __main__ - Step 672: {'lr': 0.00016775, 'samples': 129024, 'steps': 671, 'loss/train': 4.435437202453613} +11/06/2021 21:22:15 - INFO - __main__ - Step 673: {'lr': 0.00016800000000000002, 'samples': 129216, 'steps': 672, 'loss/train': 3.3415842056274414} +11/06/2021 21:22:16 - INFO - __main__ - Step 674: {'lr': 0.00016825000000000002, 'samples': 129408, 'steps': 673, 'loss/train': 4.65171480178833} +11/06/2021 21:22:16 - INFO - __main__ - Step 675: {'lr': 0.0001685, 'samples': 129600, 'steps': 674, 'loss/train': 4.98203182220459} +11/06/2021 21:22:17 - INFO - __main__ - Step 676: {'lr': 0.00016875, 'samples': 129792, 'steps': 675, 'loss/train': 5.456784248352051} +11/06/2021 21:22:17 - INFO - __main__ - Step 677: {'lr': 0.00016900000000000002, 'samples': 129984, 'steps': 676, 'loss/train': 4.679195880889893} +11/06/2021 21:22:17 - INFO - __main__ - Step 678: {'lr': 0.00016925000000000002, 'samples': 130176, 'steps': 677, 'loss/train': 4.434994697570801} +11/06/2021 21:22:18 - INFO - __main__ - Step 679: {'lr': 0.00016950000000000003, 'samples': 130368, 'steps': 678, 'loss/train': 4.650574684143066} +11/06/2021 21:22:19 - INFO - __main__ - Step 680: {'lr': 0.00016975, 'samples': 130560, 'steps': 679, 'loss/train': 4.444644451141357} +11/06/2021 21:22:19 - INFO - __main__ - Step 681: {'lr': 0.00017, 'samples': 130752, 'steps': 680, 'loss/train': 4.423855781555176} +11/06/2021 21:22:20 - INFO - __main__ - Step 682: {'lr': 0.00017025000000000002, 'samples': 130944, 'steps': 681, 'loss/train': 4.7202301025390625} +11/06/2021 21:22:20 - INFO - __main__ - Step 683: {'lr': 0.00017050000000000002, 'samples': 131136, 'steps': 682, 'loss/train': 4.4818854331970215} +11/06/2021 21:22:21 - INFO - __main__ - Step 684: {'lr': 0.00017075, 'samples': 131328, 'steps': 683, 'loss/train': 5.359105587005615} +11/06/2021 21:22:21 - INFO - __main__ - Step 685: {'lr': 0.000171, 'samples': 131520, 'steps': 684, 'loss/train': 4.730793476104736} +11/06/2021 21:22:22 - INFO - __main__ - Step 686: {'lr': 0.00017125000000000002, 'samples': 131712, 'steps': 685, 'loss/train': 4.558211803436279} +11/06/2021 21:22:22 - INFO - __main__ - Step 687: {'lr': 0.00017150000000000002, 'samples': 131904, 'steps': 686, 'loss/train': 4.429317951202393} +11/06/2021 21:22:22 - INFO - __main__ - Step 688: {'lr': 0.00017175000000000003, 'samples': 132096, 'steps': 687, 'loss/train': 4.6293816566467285} +11/06/2021 21:22:24 - INFO - __main__ - Step 689: {'lr': 0.00017199999999999998, 'samples': 132288, 'steps': 688, 'loss/train': 5.065909385681152} +11/06/2021 21:22:24 - INFO - __main__ - Step 690: {'lr': 0.00017224999999999999, 'samples': 132480, 'steps': 689, 'loss/train': 4.581766605377197} +11/06/2021 21:22:24 - INFO - __main__ - Step 691: {'lr': 0.0001725, 'samples': 132672, 'steps': 690, 'loss/train': 4.165865421295166} +11/06/2021 21:22:25 - INFO - __main__ - Step 692: {'lr': 0.00017275, 'samples': 132864, 'steps': 691, 'loss/train': 4.4996209144592285} +11/06/2021 21:22:25 - INFO - __main__ - Step 693: {'lr': 0.000173, 'samples': 133056, 'steps': 692, 'loss/train': 4.5448150634765625} +11/06/2021 21:22:25 - INFO - __main__ - Step 694: {'lr': 0.00017324999999999998, 'samples': 133248, 'steps': 693, 'loss/train': 3.898272752761841} +11/06/2021 21:22:26 - INFO - __main__ - Step 695: {'lr': 0.0001735, 'samples': 133440, 'steps': 694, 'loss/train': 4.2713165283203125} +11/06/2021 21:22:27 - INFO - __main__ - Step 696: {'lr': 0.00017375, 'samples': 133632, 'steps': 695, 'loss/train': 5.151446342468262} +11/06/2021 21:22:27 - INFO - __main__ - Step 697: {'lr': 0.000174, 'samples': 133824, 'steps': 696, 'loss/train': 4.418706893920898} +11/06/2021 21:22:28 - INFO - __main__ - Step 698: {'lr': 0.00017424999999999998, 'samples': 134016, 'steps': 697, 'loss/train': 4.960476875305176} +11/06/2021 21:22:28 - INFO - __main__ - Step 699: {'lr': 0.00017449999999999999, 'samples': 134208, 'steps': 698, 'loss/train': 4.722470760345459} +11/06/2021 21:22:30 - INFO - __main__ - Step 700: {'lr': 0.00017475, 'samples': 134400, 'steps': 699, 'loss/train': 4.800037384033203} +11/06/2021 21:22:30 - INFO - __main__ - Step 701: {'lr': 0.000175, 'samples': 134592, 'steps': 700, 'loss/train': 4.3655500411987305} +11/06/2021 21:22:30 - INFO - __main__ - Step 702: {'lr': 0.00017525, 'samples': 134784, 'steps': 701, 'loss/train': 4.725539684295654} +11/06/2021 21:22:31 - INFO - __main__ - Step 703: {'lr': 0.00017549999999999998, 'samples': 134976, 'steps': 702, 'loss/train': 4.290457248687744} +11/06/2021 21:22:31 - INFO - __main__ - Step 704: {'lr': 0.00017575, 'samples': 135168, 'steps': 703, 'loss/train': 4.849248886108398} +11/06/2021 21:22:31 - INFO - __main__ - Step 705: {'lr': 0.000176, 'samples': 135360, 'steps': 704, 'loss/train': 2.431931734085083} +11/06/2021 21:22:32 - INFO - __main__ - Step 706: {'lr': 0.00017625, 'samples': 135552, 'steps': 705, 'loss/train': 2.3060343265533447} +11/06/2021 21:22:33 - INFO - __main__ - Step 707: {'lr': 0.00017649999999999998, 'samples': 135744, 'steps': 706, 'loss/train': 2.4550411701202393} +11/06/2021 21:22:33 - INFO - __main__ - Step 708: {'lr': 0.00017675, 'samples': 135936, 'steps': 707, 'loss/train': 4.702536106109619} +11/06/2021 21:22:33 - INFO - __main__ - Step 709: {'lr': 0.000177, 'samples': 136128, 'steps': 708, 'loss/train': 4.986819267272949} +11/06/2021 21:22:34 - INFO - __main__ - Step 710: {'lr': 0.00017725, 'samples': 136320, 'steps': 709, 'loss/train': 4.857694149017334} +11/06/2021 21:22:34 - INFO - __main__ - Step 711: {'lr': 0.0001775, 'samples': 136512, 'steps': 710, 'loss/train': 4.735157012939453} +11/06/2021 21:22:35 - INFO - __main__ - Step 712: {'lr': 0.00017774999999999998, 'samples': 136704, 'steps': 711, 'loss/train': 4.753922462463379} +11/06/2021 21:22:36 - INFO - __main__ - Step 713: {'lr': 0.000178, 'samples': 136896, 'steps': 712, 'loss/train': 4.611956596374512} +11/06/2021 21:22:36 - INFO - __main__ - Step 714: {'lr': 0.00017825, 'samples': 137088, 'steps': 713, 'loss/train': 4.634572982788086} +11/06/2021 21:22:36 - INFO - __main__ - Step 715: {'lr': 0.0001785, 'samples': 137280, 'steps': 714, 'loss/train': 4.737353801727295} +11/06/2021 21:22:37 - INFO - __main__ - Step 716: {'lr': 0.00017875, 'samples': 137472, 'steps': 715, 'loss/train': 4.557127475738525} +11/06/2021 21:22:38 - INFO - __main__ - Step 717: {'lr': 0.000179, 'samples': 137664, 'steps': 716, 'loss/train': 5.090901851654053} +11/06/2021 21:22:38 - INFO - __main__ - Step 718: {'lr': 0.00017925, 'samples': 137856, 'steps': 717, 'loss/train': 4.926265716552734} +11/06/2021 21:22:39 - INFO - __main__ - Step 719: {'lr': 0.0001795, 'samples': 138048, 'steps': 718, 'loss/train': 4.575839519500732} +11/06/2021 21:22:39 - INFO - __main__ - Step 720: {'lr': 0.00017975, 'samples': 138240, 'steps': 719, 'loss/train': 4.539857864379883} +11/06/2021 21:22:39 - INFO - __main__ - Step 721: {'lr': 0.00017999999999999998, 'samples': 138432, 'steps': 720, 'loss/train': 5.017696380615234} +11/06/2021 21:22:41 - INFO - __main__ - Step 722: {'lr': 0.00018025, 'samples': 138624, 'steps': 721, 'loss/train': 4.860723495483398} +11/06/2021 21:22:41 - INFO - __main__ - Step 723: {'lr': 0.0001805, 'samples': 138816, 'steps': 722, 'loss/train': 4.767000675201416} +11/06/2021 21:22:41 - INFO - __main__ - Step 724: {'lr': 0.00018075, 'samples': 139008, 'steps': 723, 'loss/train': 4.792560577392578} +11/06/2021 21:22:42 - INFO - __main__ - Step 725: {'lr': 0.000181, 'samples': 139200, 'steps': 724, 'loss/train': 4.775363922119141} +11/06/2021 21:22:42 - INFO - __main__ - Step 726: {'lr': 0.00018125, 'samples': 139392, 'steps': 725, 'loss/train': 4.8343377113342285} +11/06/2021 21:22:42 - INFO - __main__ - Step 727: {'lr': 0.0001815, 'samples': 139584, 'steps': 726, 'loss/train': 4.501916885375977} +11/06/2021 21:22:43 - INFO - __main__ - Step 728: {'lr': 0.00018175, 'samples': 139776, 'steps': 727, 'loss/train': 4.543506145477295} +11/06/2021 21:22:44 - INFO - __main__ - Step 729: {'lr': 0.000182, 'samples': 139968, 'steps': 728, 'loss/train': 4.346724033355713} +11/06/2021 21:22:44 - INFO - __main__ - Step 730: {'lr': 0.00018225, 'samples': 140160, 'steps': 729, 'loss/train': 4.893301486968994} +11/06/2021 21:22:44 - INFO - __main__ - Step 731: {'lr': 0.0001825, 'samples': 140352, 'steps': 730, 'loss/train': 4.508211612701416} +11/06/2021 21:22:45 - INFO - __main__ - Step 732: {'lr': 0.00018275, 'samples': 140544, 'steps': 731, 'loss/train': 4.329798221588135} +11/06/2021 21:22:46 - INFO - __main__ - Step 733: {'lr': 0.000183, 'samples': 140736, 'steps': 732, 'loss/train': 4.946159362792969} +11/06/2021 21:22:46 - INFO - __main__ - Step 734: {'lr': 0.00018325, 'samples': 140928, 'steps': 733, 'loss/train': 4.753419399261475} +11/06/2021 21:22:47 - INFO - __main__ - Step 735: {'lr': 0.0001835, 'samples': 141120, 'steps': 734, 'loss/train': 5.069578170776367} +11/06/2021 21:22:47 - INFO - __main__ - Step 736: {'lr': 0.00018375, 'samples': 141312, 'steps': 735, 'loss/train': 5.126845359802246} +11/06/2021 21:22:47 - INFO - __main__ - Step 737: {'lr': 0.000184, 'samples': 141504, 'steps': 736, 'loss/train': 4.666621685028076} +11/06/2021 21:22:48 - INFO - __main__ - Step 738: {'lr': 0.00018425, 'samples': 141696, 'steps': 737, 'loss/train': 4.2837958335876465} +11/06/2021 21:22:49 - INFO - __main__ - Step 739: {'lr': 0.0001845, 'samples': 141888, 'steps': 738, 'loss/train': 4.565089702606201} +11/06/2021 21:22:49 - INFO - __main__ - Step 740: {'lr': 0.00018475, 'samples': 142080, 'steps': 739, 'loss/train': 4.330541133880615} +11/06/2021 21:22:49 - INFO - __main__ - Step 741: {'lr': 0.000185, 'samples': 142272, 'steps': 740, 'loss/train': 4.524784564971924} +11/06/2021 21:22:50 - INFO - __main__ - Step 742: {'lr': 0.00018525, 'samples': 142464, 'steps': 741, 'loss/train': 4.280323505401611} +11/06/2021 21:22:51 - INFO - __main__ - Step 743: {'lr': 0.0001855, 'samples': 142656, 'steps': 742, 'loss/train': 4.447424411773682} +11/06/2021 21:22:51 - INFO - __main__ - Step 744: {'lr': 0.00018575000000000002, 'samples': 142848, 'steps': 743, 'loss/train': 4.917816638946533} +11/06/2021 21:22:51 - INFO - __main__ - Step 745: {'lr': 0.000186, 'samples': 143040, 'steps': 744, 'loss/train': 4.4243059158325195} +11/06/2021 21:22:52 - INFO - __main__ - Step 746: {'lr': 0.00018625, 'samples': 143232, 'steps': 745, 'loss/train': 5.763511657714844} +11/06/2021 21:22:52 - INFO - __main__ - Step 747: {'lr': 0.0001865, 'samples': 143424, 'steps': 746, 'loss/train': 4.306034564971924} +11/06/2021 21:22:53 - INFO - __main__ - Step 748: {'lr': 0.00018675, 'samples': 143616, 'steps': 747, 'loss/train': 5.227732181549072} +11/06/2021 21:22:54 - INFO - __main__ - Step 749: {'lr': 0.000187, 'samples': 143808, 'steps': 748, 'loss/train': 5.433281421661377} +11/06/2021 21:22:54 - INFO - __main__ - Step 750: {'lr': 0.00018725, 'samples': 144000, 'steps': 749, 'loss/train': 4.236339092254639} +11/06/2021 21:22:54 - INFO - __main__ - Step 751: {'lr': 0.0001875, 'samples': 144192, 'steps': 750, 'loss/train': 4.570340633392334} +11/06/2021 21:22:55 - INFO - __main__ - Step 752: {'lr': 0.00018775, 'samples': 144384, 'steps': 751, 'loss/train': 4.103482723236084} +11/06/2021 21:22:55 - INFO - __main__ - Step 753: {'lr': 0.00018800000000000002, 'samples': 144576, 'steps': 752, 'loss/train': 4.504870891571045} +11/06/2021 21:22:56 - INFO - __main__ - Step 754: {'lr': 0.00018825, 'samples': 144768, 'steps': 753, 'loss/train': 4.6825480461120605} +11/06/2021 21:22:57 - INFO - __main__ - Step 755: {'lr': 0.0001885, 'samples': 144960, 'steps': 754, 'loss/train': 4.360548973083496} +11/06/2021 21:22:57 - INFO - __main__ - Step 756: {'lr': 0.00018875, 'samples': 145152, 'steps': 755, 'loss/train': 4.626955032348633} +11/06/2021 21:22:57 - INFO - __main__ - Step 757: {'lr': 0.000189, 'samples': 145344, 'steps': 756, 'loss/train': 4.462242126464844} +11/06/2021 21:22:58 - INFO - __main__ - Step 758: {'lr': 0.00018925, 'samples': 145536, 'steps': 757, 'loss/train': 4.262608528137207} +11/06/2021 21:22:59 - INFO - __main__ - Step 759: {'lr': 0.0001895, 'samples': 145728, 'steps': 758, 'loss/train': 4.549057960510254} +11/06/2021 21:22:59 - INFO - __main__ - Step 760: {'lr': 0.00018975, 'samples': 145920, 'steps': 759, 'loss/train': 4.4868574142456055} +11/06/2021 21:22:59 - INFO - __main__ - Step 761: {'lr': 0.00019, 'samples': 146112, 'steps': 760, 'loss/train': 4.394392013549805} +11/06/2021 21:23:00 - INFO - __main__ - Step 762: {'lr': 0.00019025000000000002, 'samples': 146304, 'steps': 761, 'loss/train': 4.9143500328063965} +11/06/2021 21:23:00 - INFO - __main__ - Step 763: {'lr': 0.0001905, 'samples': 146496, 'steps': 762, 'loss/train': 4.456435680389404} +11/06/2021 21:23:01 - INFO - __main__ - Step 764: {'lr': 0.00019075, 'samples': 146688, 'steps': 763, 'loss/train': 5.696299076080322} +11/06/2021 21:23:02 - INFO - __main__ - Step 765: {'lr': 0.000191, 'samples': 146880, 'steps': 764, 'loss/train': 4.935421466827393} +11/06/2021 21:23:02 - INFO - __main__ - Step 766: {'lr': 0.00019125000000000001, 'samples': 147072, 'steps': 765, 'loss/train': 4.943374156951904} +11/06/2021 21:23:02 - INFO - __main__ - Step 767: {'lr': 0.00019150000000000002, 'samples': 147264, 'steps': 766, 'loss/train': 5.322519302368164} +11/06/2021 21:23:03 - INFO - __main__ - Step 768: {'lr': 0.00019175, 'samples': 147456, 'steps': 767, 'loss/train': 4.189104080200195} +11/06/2021 21:23:04 - INFO - __main__ - Step 769: {'lr': 0.000192, 'samples': 147648, 'steps': 768, 'loss/train': 5.1701979637146} +11/06/2021 21:23:04 - INFO - __main__ - Step 770: {'lr': 0.00019225, 'samples': 147840, 'steps': 769, 'loss/train': 4.428781032562256} +11/06/2021 21:23:04 - INFO - __main__ - Step 771: {'lr': 0.00019250000000000002, 'samples': 148032, 'steps': 770, 'loss/train': 4.415109157562256} +11/06/2021 21:23:05 - INFO - __main__ - Step 772: {'lr': 0.00019275, 'samples': 148224, 'steps': 771, 'loss/train': 4.811757564544678} +11/06/2021 21:23:05 - INFO - __main__ - Step 773: {'lr': 0.000193, 'samples': 148416, 'steps': 772, 'loss/train': 4.7581634521484375} +11/06/2021 21:23:06 - INFO - __main__ - Step 774: {'lr': 0.00019325, 'samples': 148608, 'steps': 773, 'loss/train': 4.4999098777771} +11/06/2021 21:23:06 - INFO - __main__ - Step 775: {'lr': 0.00019350000000000001, 'samples': 148800, 'steps': 774, 'loss/train': 4.690352439880371} +11/06/2021 21:23:07 - INFO - __main__ - Step 776: {'lr': 0.00019375000000000002, 'samples': 148992, 'steps': 775, 'loss/train': 4.419637203216553} +11/06/2021 21:23:07 - INFO - __main__ - Step 777: {'lr': 0.000194, 'samples': 149184, 'steps': 776, 'loss/train': 4.947287559509277} +11/06/2021 21:23:08 - INFO - __main__ - Step 778: {'lr': 0.00019425, 'samples': 149376, 'steps': 777, 'loss/train': 5.457443714141846} +11/06/2021 21:23:09 - INFO - __main__ - Step 779: {'lr': 0.0001945, 'samples': 149568, 'steps': 778, 'loss/train': 4.38627815246582} +11/06/2021 21:23:09 - INFO - __main__ - Step 780: {'lr': 0.00019475000000000002, 'samples': 149760, 'steps': 779, 'loss/train': 5.3790178298950195} +11/06/2021 21:23:09 - INFO - __main__ - Step 781: {'lr': 0.00019500000000000002, 'samples': 149952, 'steps': 780, 'loss/train': 4.04803466796875} +11/06/2021 21:23:10 - INFO - __main__ - Step 782: {'lr': 0.00019525, 'samples': 150144, 'steps': 781, 'loss/train': 4.558263301849365} +11/06/2021 21:23:10 - INFO - __main__ - Step 783: {'lr': 0.0001955, 'samples': 150336, 'steps': 782, 'loss/train': 4.308804988861084} +11/06/2021 21:23:11 - INFO - __main__ - Step 784: {'lr': 0.00019575000000000001, 'samples': 150528, 'steps': 783, 'loss/train': 5.033785820007324} +11/06/2021 21:23:11 - INFO - __main__ - Step 785: {'lr': 0.00019600000000000002, 'samples': 150720, 'steps': 784, 'loss/train': 4.059752464294434} +11/06/2021 21:23:12 - INFO - __main__ - Step 786: {'lr': 0.00019625, 'samples': 150912, 'steps': 785, 'loss/train': 4.140824317932129} +11/06/2021 21:23:12 - INFO - __main__ - Step 787: {'lr': 0.0001965, 'samples': 151104, 'steps': 786, 'loss/train': 4.625868797302246} +11/06/2021 21:23:12 - INFO - __main__ - Step 788: {'lr': 0.00019675, 'samples': 151296, 'steps': 787, 'loss/train': 4.85765266418457} +11/06/2021 21:23:14 - INFO - __main__ - Step 789: {'lr': 0.00019700000000000002, 'samples': 151488, 'steps': 788, 'loss/train': 4.904588222503662} +11/06/2021 21:23:14 - INFO - __main__ - Step 790: {'lr': 0.00019725000000000002, 'samples': 151680, 'steps': 789, 'loss/train': 4.804408550262451} +11/06/2021 21:23:14 - INFO - __main__ - Step 791: {'lr': 0.0001975, 'samples': 151872, 'steps': 790, 'loss/train': 4.8462114334106445} +11/06/2021 21:23:15 - INFO - __main__ - Step 792: {'lr': 0.00019775, 'samples': 152064, 'steps': 791, 'loss/train': 4.475534439086914} +11/06/2021 21:23:15 - INFO - __main__ - Step 793: {'lr': 0.00019800000000000002, 'samples': 152256, 'steps': 792, 'loss/train': 4.764225482940674} +11/06/2021 21:23:16 - INFO - __main__ - Step 794: {'lr': 0.00019825000000000002, 'samples': 152448, 'steps': 793, 'loss/train': 4.824385643005371} +11/06/2021 21:23:16 - INFO - __main__ - Step 795: {'lr': 0.00019850000000000003, 'samples': 152640, 'steps': 794, 'loss/train': 4.384396076202393} +11/06/2021 21:23:17 - INFO - __main__ - Step 796: {'lr': 0.00019875, 'samples': 152832, 'steps': 795, 'loss/train': 4.154908657073975} +11/06/2021 21:23:17 - INFO - __main__ - Step 797: {'lr': 0.000199, 'samples': 153024, 'steps': 796, 'loss/train': 4.558513641357422} +11/06/2021 21:23:18 - INFO - __main__ - Step 798: {'lr': 0.00019925000000000002, 'samples': 153216, 'steps': 797, 'loss/train': 4.913057327270508} +11/06/2021 21:23:18 - INFO - __main__ - Step 799: {'lr': 0.00019950000000000002, 'samples': 153408, 'steps': 798, 'loss/train': 4.051199913024902} +11/06/2021 21:23:20 - INFO - __main__ - Step 800: {'lr': 0.00019975, 'samples': 153600, 'steps': 799, 'loss/train': 3.938993215560913} +11/06/2021 21:23:20 - INFO - __main__ - Step 801: {'lr': 0.0002, 'samples': 153792, 'steps': 800, 'loss/train': 4.724459648132324} +11/06/2021 21:23:20 - INFO - __main__ - Step 802: {'lr': 0.00020025000000000002, 'samples': 153984, 'steps': 801, 'loss/train': 6.338046550750732} +11/06/2021 21:23:21 - INFO - __main__ - Step 803: {'lr': 0.00020050000000000002, 'samples': 154176, 'steps': 802, 'loss/train': 2.221121072769165} +11/06/2021 21:23:21 - INFO - __main__ - Step 804: {'lr': 0.00020075000000000003, 'samples': 154368, 'steps': 803, 'loss/train': 2.2776834964752197} +11/06/2021 21:23:21 - INFO - __main__ - Step 805: {'lr': 0.000201, 'samples': 154560, 'steps': 804, 'loss/train': 2.1242752075195312} +11/06/2021 21:23:22 - INFO - __main__ - Step 806: {'lr': 0.00020125, 'samples': 154752, 'steps': 805, 'loss/train': 3.73689603805542} +11/06/2021 21:23:23 - INFO - __main__ - Step 807: {'lr': 0.00020150000000000002, 'samples': 154944, 'steps': 806, 'loss/train': 4.354226112365723} +11/06/2021 21:23:23 - INFO - __main__ - Step 808: {'lr': 0.00020175000000000003, 'samples': 155136, 'steps': 807, 'loss/train': 4.5094475746154785} +11/06/2021 21:23:24 - INFO - __main__ - Step 809: {'lr': 0.000202, 'samples': 155328, 'steps': 808, 'loss/train': 4.677899360656738} +11/06/2021 21:23:24 - INFO - __main__ - Step 810: {'lr': 0.00020225, 'samples': 155520, 'steps': 809, 'loss/train': 4.373321533203125} +11/06/2021 21:23:25 - INFO - __main__ - Step 811: {'lr': 0.00020250000000000002, 'samples': 155712, 'steps': 810, 'loss/train': 5.149594306945801} +11/06/2021 21:23:26 - INFO - __main__ - Step 812: {'lr': 0.00020275000000000002, 'samples': 155904, 'steps': 811, 'loss/train': 4.3080902099609375} +11/06/2021 21:23:26 - INFO - __main__ - Step 813: {'lr': 0.00020300000000000003, 'samples': 156096, 'steps': 812, 'loss/train': 4.42739725112915} +11/06/2021 21:23:26 - INFO - __main__ - Step 814: {'lr': 0.00020324999999999998, 'samples': 156288, 'steps': 813, 'loss/train': 4.6587677001953125} +11/06/2021 21:23:27 - INFO - __main__ - Step 815: {'lr': 0.00020349999999999999, 'samples': 156480, 'steps': 814, 'loss/train': 4.584706783294678} +11/06/2021 21:23:27 - INFO - __main__ - Step 816: {'lr': 0.00020375, 'samples': 156672, 'steps': 815, 'loss/train': 4.675464153289795} +11/06/2021 21:23:28 - INFO - __main__ - Step 817: {'lr': 0.000204, 'samples': 156864, 'steps': 816, 'loss/train': 4.275284767150879} +11/06/2021 21:23:28 - INFO - __main__ - Step 818: {'lr': 0.00020425, 'samples': 157056, 'steps': 817, 'loss/train': 4.487129211425781} +11/06/2021 21:23:29 - INFO - __main__ - Step 819: {'lr': 0.00020449999999999998, 'samples': 157248, 'steps': 818, 'loss/train': 3.8839242458343506} +11/06/2021 21:23:29 - INFO - __main__ - Step 820: {'lr': 0.00020475, 'samples': 157440, 'steps': 819, 'loss/train': 5.175144672393799} +11/06/2021 21:23:30 - INFO - __main__ - Step 821: {'lr': 0.000205, 'samples': 157632, 'steps': 820, 'loss/train': 4.6907877922058105} +11/06/2021 21:23:31 - INFO - __main__ - Step 822: {'lr': 0.00020525, 'samples': 157824, 'steps': 821, 'loss/train': 5.107820987701416} +11/06/2021 21:23:31 - INFO - __main__ - Step 823: {'lr': 0.00020549999999999998, 'samples': 158016, 'steps': 822, 'loss/train': 4.4801106452941895} +11/06/2021 21:23:31 - INFO - __main__ - Step 824: {'lr': 0.00020575, 'samples': 158208, 'steps': 823, 'loss/train': 4.510085105895996} +11/06/2021 21:23:32 - INFO - __main__ - Step 825: {'lr': 0.000206, 'samples': 158400, 'steps': 824, 'loss/train': 4.396790981292725} +11/06/2021 21:23:32 - INFO - __main__ - Step 826: {'lr': 0.00020625, 'samples': 158592, 'steps': 825, 'loss/train': 4.010310649871826} +11/06/2021 21:23:32 - INFO - __main__ - Step 827: {'lr': 0.0002065, 'samples': 158784, 'steps': 826, 'loss/train': 4.797766208648682} +11/06/2021 21:23:33 - INFO - __main__ - Step 828: {'lr': 0.00020674999999999998, 'samples': 158976, 'steps': 827, 'loss/train': 4.619658470153809} +11/06/2021 21:23:34 - INFO - __main__ - Step 829: {'lr': 0.000207, 'samples': 159168, 'steps': 828, 'loss/train': 4.163397312164307} +11/06/2021 21:23:34 - INFO - __main__ - Step 830: {'lr': 0.00020725, 'samples': 159360, 'steps': 829, 'loss/train': 4.228115081787109} +11/06/2021 21:23:34 - INFO - __main__ - Step 831: {'lr': 0.0002075, 'samples': 159552, 'steps': 830, 'loss/train': 4.451252460479736} +11/06/2021 21:23:35 - INFO - __main__ - Step 832: {'lr': 0.00020774999999999998, 'samples': 159744, 'steps': 831, 'loss/train': 4.284130096435547} +11/06/2021 21:23:36 - INFO - __main__ - Step 833: {'lr': 0.000208, 'samples': 159936, 'steps': 832, 'loss/train': 4.7883687019348145} +11/06/2021 21:23:36 - INFO - __main__ - Step 834: {'lr': 0.00020825, 'samples': 160128, 'steps': 833, 'loss/train': 4.043850898742676} +11/06/2021 21:23:37 - INFO - __main__ - Step 835: {'lr': 0.0002085, 'samples': 160320, 'steps': 834, 'loss/train': 4.566141128540039} +11/06/2021 21:23:37 - INFO - __main__ - Step 836: {'lr': 0.00020875, 'samples': 160512, 'steps': 835, 'loss/train': 5.373464584350586} +11/06/2021 21:23:37 - INFO - __main__ - Step 837: {'lr': 0.00020899999999999998, 'samples': 160704, 'steps': 836, 'loss/train': 4.873067378997803} +11/06/2021 21:23:39 - INFO - __main__ - Step 838: {'lr': 0.00020925, 'samples': 160896, 'steps': 837, 'loss/train': 4.9676995277404785} +11/06/2021 21:23:39 - INFO - __main__ - Step 839: {'lr': 0.0002095, 'samples': 161088, 'steps': 838, 'loss/train': 4.646881103515625} +11/06/2021 21:23:39 - INFO - __main__ - Step 840: {'lr': 0.00020975, 'samples': 161280, 'steps': 839, 'loss/train': 4.013716220855713} +11/06/2021 21:23:40 - INFO - __main__ - Step 841: {'lr': 0.00021, 'samples': 161472, 'steps': 840, 'loss/train': 6.019371509552002} +11/06/2021 21:23:40 - INFO - __main__ - Step 842: {'lr': 0.00021025, 'samples': 161664, 'steps': 841, 'loss/train': 3.9948506355285645} +11/06/2021 21:23:41 - INFO - __main__ - Step 843: {'lr': 0.0002105, 'samples': 161856, 'steps': 842, 'loss/train': 4.164978504180908} +11/06/2021 21:23:42 - INFO - __main__ - Step 844: {'lr': 0.00021075, 'samples': 162048, 'steps': 843, 'loss/train': 4.208803176879883} +11/06/2021 21:23:42 - INFO - __main__ - Step 845: {'lr': 0.000211, 'samples': 162240, 'steps': 844, 'loss/train': 5.149277210235596} +11/06/2021 21:23:42 - INFO - __main__ - Step 846: {'lr': 0.00021124999999999998, 'samples': 162432, 'steps': 845, 'loss/train': 4.742812156677246} +11/06/2021 21:23:43 - INFO - __main__ - Step 847: {'lr': 0.0002115, 'samples': 162624, 'steps': 846, 'loss/train': 4.207589149475098} +11/06/2021 21:23:43 - INFO - __main__ - Step 848: {'lr': 0.00021175, 'samples': 162816, 'steps': 847, 'loss/train': 4.035452842712402} +11/06/2021 21:23:44 - INFO - __main__ - Step 849: {'lr': 0.000212, 'samples': 163008, 'steps': 848, 'loss/train': 4.860066890716553} +11/06/2021 21:23:45 - INFO - __main__ - Step 850: {'lr': 0.00021225, 'samples': 163200, 'steps': 849, 'loss/train': 3.371035575866699} +11/06/2021 21:23:45 - INFO - __main__ - Step 851: {'lr': 0.0002125, 'samples': 163392, 'steps': 850, 'loss/train': 4.5741753578186035} +11/06/2021 21:23:45 - INFO - __main__ - Step 852: {'lr': 0.00021275, 'samples': 163584, 'steps': 851, 'loss/train': 4.537678241729736} +11/06/2021 21:23:46 - INFO - __main__ - Step 853: {'lr': 0.000213, 'samples': 163776, 'steps': 852, 'loss/train': 4.552616119384766} +11/06/2021 21:23:47 - INFO - __main__ - Step 854: {'lr': 0.00021325, 'samples': 163968, 'steps': 853, 'loss/train': 4.6721577644348145} +11/06/2021 21:23:47 - INFO - __main__ - Step 855: {'lr': 0.0002135, 'samples': 164160, 'steps': 854, 'loss/train': 4.655636310577393} +11/06/2021 21:23:47 - INFO - __main__ - Step 856: {'lr': 0.00021375, 'samples': 164352, 'steps': 855, 'loss/train': 4.305333614349365} +11/06/2021 21:23:48 - INFO - __main__ - Step 857: {'lr': 0.000214, 'samples': 164544, 'steps': 856, 'loss/train': 4.127890110015869} +11/06/2021 21:23:48 - INFO - __main__ - Step 858: {'lr': 0.00021425, 'samples': 164736, 'steps': 857, 'loss/train': 4.549274921417236} +11/06/2021 21:23:49 - INFO - __main__ - Step 859: {'lr': 0.0002145, 'samples': 164928, 'steps': 858, 'loss/train': 3.803431510925293} +11/06/2021 21:23:50 - INFO - __main__ - Step 860: {'lr': 0.00021475, 'samples': 165120, 'steps': 859, 'loss/train': 4.316712379455566} +11/06/2021 21:23:50 - INFO - __main__ - Step 861: {'lr': 0.000215, 'samples': 165312, 'steps': 860, 'loss/train': 4.917266845703125} +11/06/2021 21:23:50 - INFO - __main__ - Step 862: {'lr': 0.00021525, 'samples': 165504, 'steps': 861, 'loss/train': 4.41719913482666} +11/06/2021 21:23:51 - INFO - __main__ - Step 863: {'lr': 0.0002155, 'samples': 165696, 'steps': 862, 'loss/train': 4.436905384063721} +11/06/2021 21:23:52 - INFO - __main__ - Step 864: {'lr': 0.00021575, 'samples': 165888, 'steps': 863, 'loss/train': 4.34383487701416} +11/06/2021 21:23:52 - INFO - __main__ - Step 865: {'lr': 0.000216, 'samples': 166080, 'steps': 864, 'loss/train': 4.4350080490112305} +11/06/2021 21:23:52 - INFO - __main__ - Step 866: {'lr': 0.00021625, 'samples': 166272, 'steps': 865, 'loss/train': 4.548778057098389} +11/06/2021 21:23:53 - INFO - __main__ - Step 867: {'lr': 0.0002165, 'samples': 166464, 'steps': 866, 'loss/train': 4.653875827789307} +11/06/2021 21:23:53 - INFO - __main__ - Step 868: {'lr': 0.00021675, 'samples': 166656, 'steps': 867, 'loss/train': 4.1312150955200195} +11/06/2021 21:23:54 - INFO - __main__ - Step 869: {'lr': 0.00021700000000000002, 'samples': 166848, 'steps': 868, 'loss/train': 4.243196964263916} +11/06/2021 21:23:54 - INFO - __main__ - Step 870: {'lr': 0.00021725, 'samples': 167040, 'steps': 869, 'loss/train': 4.393092155456543} +11/06/2021 21:23:55 - INFO - __main__ - Step 871: {'lr': 0.0002175, 'samples': 167232, 'steps': 870, 'loss/train': 4.559785842895508} +11/06/2021 21:23:55 - INFO - __main__ - Step 872: {'lr': 0.00021775, 'samples': 167424, 'steps': 871, 'loss/train': 1.9217588901519775} +11/06/2021 21:23:55 - INFO - __main__ - Step 873: {'lr': 0.000218, 'samples': 167616, 'steps': 872, 'loss/train': 4.757959365844727} +11/06/2021 21:23:57 - INFO - __main__ - Step 874: {'lr': 0.00021825, 'samples': 167808, 'steps': 873, 'loss/train': 4.589957237243652} +11/06/2021 21:23:57 - INFO - __main__ - Step 875: {'lr': 0.0002185, 'samples': 168000, 'steps': 874, 'loss/train': 4.484537124633789} +11/06/2021 21:23:57 - INFO - __main__ - Step 876: {'lr': 0.00021875, 'samples': 168192, 'steps': 875, 'loss/train': 4.340537071228027} +11/06/2021 21:23:58 - INFO - __main__ - Step 877: {'lr': 0.000219, 'samples': 168384, 'steps': 876, 'loss/train': 4.769442558288574} +11/06/2021 21:23:58 - INFO - __main__ - Step 878: {'lr': 0.00021925000000000002, 'samples': 168576, 'steps': 877, 'loss/train': 4.576560974121094} +11/06/2021 21:23:59 - INFO - __main__ - Step 879: {'lr': 0.0002195, 'samples': 168768, 'steps': 878, 'loss/train': 4.7822418212890625} +11/06/2021 21:23:59 - INFO - __main__ - Step 880: {'lr': 0.00021975, 'samples': 168960, 'steps': 879, 'loss/train': 4.239711284637451} +11/06/2021 21:24:00 - INFO - __main__ - Step 881: {'lr': 0.00022, 'samples': 169152, 'steps': 880, 'loss/train': 4.899833679199219} +11/06/2021 21:24:00 - INFO - __main__ - Step 882: {'lr': 0.00022025000000000001, 'samples': 169344, 'steps': 881, 'loss/train': 4.500170707702637} +11/06/2021 21:24:00 - INFO - __main__ - Step 883: {'lr': 0.0002205, 'samples': 169536, 'steps': 882, 'loss/train': 4.454834938049316} +11/06/2021 21:24:02 - INFO - __main__ - Step 884: {'lr': 0.00022075, 'samples': 169728, 'steps': 883, 'loss/train': 4.347689151763916} +11/06/2021 21:24:02 - INFO - __main__ - Step 885: {'lr': 0.000221, 'samples': 169920, 'steps': 884, 'loss/train': 4.470192909240723} +11/06/2021 21:24:02 - INFO - __main__ - Step 886: {'lr': 0.00022125, 'samples': 170112, 'steps': 885, 'loss/train': 3.8449060916900635} +11/06/2021 21:24:03 - INFO - __main__ - Step 887: {'lr': 0.00022150000000000002, 'samples': 170304, 'steps': 886, 'loss/train': 3.2878403663635254} +11/06/2021 21:24:03 - INFO - __main__ - Step 888: {'lr': 0.00022175, 'samples': 170496, 'steps': 887, 'loss/train': 4.312256813049316} +11/06/2021 21:24:04 - INFO - __main__ - Step 889: {'lr': 0.000222, 'samples': 170688, 'steps': 888, 'loss/train': 4.553658962249756} +11/06/2021 21:24:04 - INFO - __main__ - Step 890: {'lr': 0.00022225, 'samples': 170880, 'steps': 889, 'loss/train': 4.031077861785889} +11/06/2021 21:24:05 - INFO - __main__ - Step 891: {'lr': 0.00022250000000000001, 'samples': 171072, 'steps': 890, 'loss/train': 4.104956150054932} +11/06/2021 21:24:05 - INFO - __main__ - Step 892: {'lr': 0.00022275000000000002, 'samples': 171264, 'steps': 891, 'loss/train': 4.234619617462158} +11/06/2021 21:24:05 - INFO - __main__ - Step 893: {'lr': 0.000223, 'samples': 171456, 'steps': 892, 'loss/train': 3.9380950927734375} +11/06/2021 21:24:06 - INFO - __main__ - Step 894: {'lr': 0.00022325, 'samples': 171648, 'steps': 893, 'loss/train': 3.4913272857666016} +11/06/2021 21:24:07 - INFO - __main__ - Step 895: {'lr': 0.0002235, 'samples': 171840, 'steps': 894, 'loss/train': 2.99515700340271} +11/06/2021 21:24:07 - INFO - __main__ - Step 896: {'lr': 0.00022375000000000002, 'samples': 172032, 'steps': 895, 'loss/train': 4.716649055480957} +11/06/2021 21:24:07 - INFO - __main__ - Step 897: {'lr': 0.000224, 'samples': 172224, 'steps': 896, 'loss/train': 3.291337251663208} +11/06/2021 21:24:08 - INFO - __main__ - Step 898: {'lr': 0.00022425, 'samples': 172416, 'steps': 897, 'loss/train': 4.090959548950195} +11/06/2021 21:24:08 - INFO - __main__ - Step 899: {'lr': 0.0002245, 'samples': 172608, 'steps': 898, 'loss/train': 4.231109142303467} +11/06/2021 21:24:09 - INFO - __main__ - Step 900: {'lr': 0.00022475000000000001, 'samples': 172800, 'steps': 899, 'loss/train': 3.5604536533355713} +11/06/2021 21:24:09 - INFO - __main__ - Step 901: {'lr': 0.00022500000000000002, 'samples': 172992, 'steps': 900, 'loss/train': 4.001966953277588} +11/06/2021 21:24:10 - INFO - __main__ - Step 902: {'lr': 0.00022525, 'samples': 173184, 'steps': 901, 'loss/train': 4.180810928344727} +11/06/2021 21:24:10 - INFO - __main__ - Step 903: {'lr': 0.0002255, 'samples': 173376, 'steps': 902, 'loss/train': 4.559982776641846} +11/06/2021 21:24:11 - INFO - __main__ - Step 904: {'lr': 0.00022575, 'samples': 173568, 'steps': 903, 'loss/train': 4.321451663970947} +11/06/2021 21:24:12 - INFO - __main__ - Step 905: {'lr': 0.00022600000000000002, 'samples': 173760, 'steps': 904, 'loss/train': 4.82120943069458} +11/06/2021 21:24:12 - INFO - __main__ - Step 906: {'lr': 0.00022625000000000002, 'samples': 173952, 'steps': 905, 'loss/train': 4.165206432342529} +11/06/2021 21:24:12 - INFO - __main__ - Step 907: {'lr': 0.0002265, 'samples': 174144, 'steps': 906, 'loss/train': 2.5543439388275146} +11/06/2021 21:24:13 - INFO - __main__ - Step 908: {'lr': 0.00022675, 'samples': 174336, 'steps': 907, 'loss/train': 4.742263317108154} +11/06/2021 21:24:13 - INFO - __main__ - Step 909: {'lr': 0.00022700000000000002, 'samples': 174528, 'steps': 908, 'loss/train': 4.112782001495361} +11/06/2021 21:24:14 - INFO - __main__ - Step 910: {'lr': 0.00022725000000000002, 'samples': 174720, 'steps': 909, 'loss/train': 4.566103458404541} +11/06/2021 21:24:15 - INFO - __main__ - Step 911: {'lr': 0.0002275, 'samples': 174912, 'steps': 910, 'loss/train': 4.344858169555664} +11/06/2021 21:24:15 - INFO - __main__ - Step 912: {'lr': 0.00022775, 'samples': 175104, 'steps': 911, 'loss/train': 3.5020289421081543} +11/06/2021 21:24:15 - INFO - __main__ - Step 913: {'lr': 0.000228, 'samples': 175296, 'steps': 912, 'loss/train': 4.5875163078308105} +11/06/2021 21:24:16 - INFO - __main__ - Step 914: {'lr': 0.00022825000000000002, 'samples': 175488, 'steps': 913, 'loss/train': 4.796538352966309} +11/06/2021 21:24:17 - INFO - __main__ - Step 915: {'lr': 0.00022850000000000002, 'samples': 175680, 'steps': 914, 'loss/train': 4.283998966217041} +11/06/2021 21:24:17 - INFO - __main__ - Step 916: {'lr': 0.00022875, 'samples': 175872, 'steps': 915, 'loss/train': 4.674391746520996} +11/06/2021 21:24:17 - INFO - __main__ - Step 917: {'lr': 0.000229, 'samples': 176064, 'steps': 916, 'loss/train': 5.0381999015808105} +11/06/2021 21:24:18 - INFO - __main__ - Step 918: {'lr': 0.00022925000000000002, 'samples': 176256, 'steps': 917, 'loss/train': 4.393980503082275} +11/06/2021 21:24:18 - INFO - __main__ - Step 919: {'lr': 0.00022950000000000002, 'samples': 176448, 'steps': 918, 'loss/train': 3.857478141784668} +11/06/2021 21:24:19 - INFO - __main__ - Step 920: {'lr': 0.00022975000000000003, 'samples': 176640, 'steps': 919, 'loss/train': 4.180598258972168} +11/06/2021 21:24:19 - INFO - __main__ - Step 921: {'lr': 0.00023, 'samples': 176832, 'steps': 920, 'loss/train': 4.508198261260986} +11/06/2021 21:24:20 - INFO - __main__ - Step 922: {'lr': 0.00023025, 'samples': 177024, 'steps': 921, 'loss/train': 4.902273654937744} +11/06/2021 21:24:20 - INFO - __main__ - Step 923: {'lr': 0.00023050000000000002, 'samples': 177216, 'steps': 922, 'loss/train': 3.9419641494750977} +11/06/2021 21:24:21 - INFO - __main__ - Step 924: {'lr': 0.00023075000000000003, 'samples': 177408, 'steps': 923, 'loss/train': 4.182397365570068} +11/06/2021 21:24:21 - INFO - __main__ - Step 925: {'lr': 0.000231, 'samples': 177600, 'steps': 924, 'loss/train': 5.673306941986084} +11/06/2021 21:24:22 - INFO - __main__ - Step 926: {'lr': 0.00023125, 'samples': 177792, 'steps': 925, 'loss/train': 4.469267845153809} +11/06/2021 21:24:22 - INFO - __main__ - Step 927: {'lr': 0.00023150000000000002, 'samples': 177984, 'steps': 926, 'loss/train': 4.016385078430176} +11/06/2021 21:24:23 - INFO - __main__ - Step 928: {'lr': 0.00023175000000000002, 'samples': 178176, 'steps': 927, 'loss/train': 4.510035037994385} +11/06/2021 21:24:23 - INFO - __main__ - Step 929: {'lr': 0.00023200000000000003, 'samples': 178368, 'steps': 928, 'loss/train': 3.650172233581543} +11/06/2021 21:24:23 - INFO - __main__ - Step 930: {'lr': 0.00023225, 'samples': 178560, 'steps': 929, 'loss/train': 3.8825185298919678} +11/06/2021 21:24:24 - INFO - __main__ - Step 931: {'lr': 0.0002325, 'samples': 178752, 'steps': 930, 'loss/train': 4.376020908355713} +11/06/2021 21:24:25 - INFO - __main__ - Step 932: {'lr': 0.00023275000000000002, 'samples': 178944, 'steps': 931, 'loss/train': 4.174633979797363} +11/06/2021 21:24:25 - INFO - __main__ - Step 933: {'lr': 0.00023300000000000003, 'samples': 179136, 'steps': 932, 'loss/train': 4.296014785766602} +11/06/2021 21:24:25 - INFO - __main__ - Step 934: {'lr': 0.00023325, 'samples': 179328, 'steps': 933, 'loss/train': 3.821877956390381} +11/06/2021 21:24:26 - INFO - __main__ - Step 935: {'lr': 0.0002335, 'samples': 179520, 'steps': 934, 'loss/train': 4.20390510559082} +11/06/2021 21:24:27 - INFO - __main__ - Step 936: {'lr': 0.00023375000000000002, 'samples': 179712, 'steps': 935, 'loss/train': 4.282657623291016} +11/06/2021 21:24:27 - INFO - __main__ - Step 937: {'lr': 0.00023400000000000002, 'samples': 179904, 'steps': 936, 'loss/train': 3.8457953929901123} +11/06/2021 21:24:28 - INFO - __main__ - Step 938: {'lr': 0.00023425000000000003, 'samples': 180096, 'steps': 937, 'loss/train': 4.099065780639648} +11/06/2021 21:24:28 - INFO - __main__ - Step 939: {'lr': 0.00023449999999999998, 'samples': 180288, 'steps': 938, 'loss/train': 4.02554988861084} +11/06/2021 21:24:28 - INFO - __main__ - Step 940: {'lr': 0.00023475, 'samples': 180480, 'steps': 939, 'loss/train': 4.181853294372559} +11/06/2021 21:24:29 - INFO - __main__ - Step 941: {'lr': 0.000235, 'samples': 180672, 'steps': 940, 'loss/train': 4.0363969802856445} +11/06/2021 21:24:30 - INFO - __main__ - Step 942: {'lr': 0.00023525, 'samples': 180864, 'steps': 941, 'loss/train': 4.118391036987305} +11/06/2021 21:24:30 - INFO - __main__ - Step 943: {'lr': 0.0002355, 'samples': 181056, 'steps': 942, 'loss/train': 4.28350830078125} +11/06/2021 21:24:30 - INFO - __main__ - Step 944: {'lr': 0.00023574999999999998, 'samples': 181248, 'steps': 943, 'loss/train': 3.8540680408477783} +11/06/2021 21:24:31 - INFO - __main__ - Step 945: {'lr': 0.000236, 'samples': 181440, 'steps': 944, 'loss/train': 4.089186191558838} +11/06/2021 21:24:32 - INFO - __main__ - Step 946: {'lr': 0.00023625, 'samples': 181632, 'steps': 945, 'loss/train': 4.698647975921631} +11/06/2021 21:24:32 - INFO - __main__ - Step 947: {'lr': 0.0002365, 'samples': 181824, 'steps': 946, 'loss/train': 4.4743123054504395} +11/06/2021 21:24:32 - INFO - __main__ - Step 948: {'lr': 0.00023674999999999998, 'samples': 182016, 'steps': 947, 'loss/train': 4.072103500366211} +11/06/2021 21:24:33 - INFO - __main__ - Step 949: {'lr': 0.000237, 'samples': 182208, 'steps': 948, 'loss/train': 4.225581169128418} +11/06/2021 21:24:33 - INFO - __main__ - Step 950: {'lr': 0.00023725, 'samples': 182400, 'steps': 949, 'loss/train': 4.038322448730469} +11/06/2021 21:24:34 - INFO - __main__ - Step 951: {'lr': 0.0002375, 'samples': 182592, 'steps': 950, 'loss/train': 4.349215984344482} +11/06/2021 21:24:35 - INFO - __main__ - Step 952: {'lr': 0.00023775, 'samples': 182784, 'steps': 951, 'loss/train': 4.141671180725098} +11/06/2021 21:24:35 - INFO - __main__ - Step 953: {'lr': 0.00023799999999999998, 'samples': 182976, 'steps': 952, 'loss/train': 3.437227725982666} +11/06/2021 21:24:35 - INFO - __main__ - Step 954: {'lr': 0.00023825, 'samples': 183168, 'steps': 953, 'loss/train': 4.3065505027771} +11/06/2021 21:24:36 - INFO - __main__ - Step 955: {'lr': 0.0002385, 'samples': 183360, 'steps': 954, 'loss/train': 4.3600687980651855} +11/06/2021 21:24:36 - INFO - __main__ - Step 956: {'lr': 0.00023875, 'samples': 183552, 'steps': 955, 'loss/train': 3.731297731399536} +11/06/2021 21:24:37 - INFO - __main__ - Step 957: {'lr': 0.00023899999999999998, 'samples': 183744, 'steps': 956, 'loss/train': 4.126706600189209} +11/06/2021 21:24:37 - INFO - __main__ - Step 958: {'lr': 0.00023925, 'samples': 183936, 'steps': 957, 'loss/train': 4.03998327255249} +11/06/2021 21:24:38 - INFO - __main__ - Step 959: {'lr': 0.0002395, 'samples': 184128, 'steps': 958, 'loss/train': 4.376034259796143} +11/06/2021 21:24:38 - INFO - __main__ - Step 960: {'lr': 0.00023975, 'samples': 184320, 'steps': 959, 'loss/train': 4.163696765899658} +11/06/2021 21:24:39 - INFO - __main__ - Step 961: {'lr': 0.00024, 'samples': 184512, 'steps': 960, 'loss/train': 3.9525156021118164} +11/06/2021 21:24:40 - INFO - __main__ - Step 962: {'lr': 0.00024024999999999999, 'samples': 184704, 'steps': 961, 'loss/train': 4.245794296264648} +11/06/2021 21:24:40 - INFO - __main__ - Step 963: {'lr': 0.0002405, 'samples': 184896, 'steps': 962, 'loss/train': 4.1179914474487305} +11/06/2021 21:24:41 - INFO - __main__ - Step 964: {'lr': 0.00024075, 'samples': 185088, 'steps': 963, 'loss/train': 3.9547386169433594} +11/06/2021 21:24:41 - INFO - __main__ - Step 965: {'lr': 0.000241, 'samples': 185280, 'steps': 964, 'loss/train': 5.651031494140625} +11/06/2021 21:24:41 - INFO - __main__ - Step 966: {'lr': 0.00024125, 'samples': 185472, 'steps': 965, 'loss/train': 4.45121431350708} +11/06/2021 21:24:42 - INFO - __main__ - Step 967: {'lr': 0.0002415, 'samples': 185664, 'steps': 966, 'loss/train': 4.361720561981201} +11/06/2021 21:24:43 - INFO - __main__ - Step 968: {'lr': 0.00024175, 'samples': 185856, 'steps': 967, 'loss/train': 4.614392280578613} +11/06/2021 21:24:43 - INFO - __main__ - Step 969: {'lr': 0.000242, 'samples': 186048, 'steps': 968, 'loss/train': 4.159306526184082} +11/06/2021 21:24:43 - INFO - __main__ - Step 970: {'lr': 0.00024225, 'samples': 186240, 'steps': 969, 'loss/train': 4.633758544921875} +11/06/2021 21:24:44 - INFO - __main__ - Step 971: {'lr': 0.00024249999999999999, 'samples': 186432, 'steps': 970, 'loss/train': 3.539381742477417} +11/06/2021 21:24:45 - INFO - __main__ - Step 972: {'lr': 0.00024275, 'samples': 186624, 'steps': 971, 'loss/train': 4.320156097412109} +11/06/2021 21:24:45 - INFO - __main__ - Step 973: {'lr': 0.000243, 'samples': 186816, 'steps': 972, 'loss/train': 4.2555952072143555} +11/06/2021 21:24:45 - INFO - __main__ - Step 974: {'lr': 0.00024325, 'samples': 187008, 'steps': 973, 'loss/train': 4.501039505004883} +11/06/2021 21:24:46 - INFO - __main__ - Step 975: {'lr': 0.0002435, 'samples': 187200, 'steps': 974, 'loss/train': 4.149434566497803} +11/06/2021 21:24:46 - INFO - __main__ - Step 976: {'lr': 0.00024375, 'samples': 187392, 'steps': 975, 'loss/train': 4.1013922691345215} +11/06/2021 21:24:47 - INFO - __main__ - Step 977: {'lr': 0.000244, 'samples': 187584, 'steps': 976, 'loss/train': 4.386606216430664} +11/06/2021 21:24:47 - INFO - __main__ - Step 978: {'lr': 0.00024425, 'samples': 187776, 'steps': 977, 'loss/train': 5.693066596984863} +11/06/2021 21:24:48 - INFO - __main__ - Step 979: {'lr': 0.0002445, 'samples': 187968, 'steps': 978, 'loss/train': 4.069120407104492} +11/06/2021 21:24:48 - INFO - __main__ - Step 980: {'lr': 0.00024475, 'samples': 188160, 'steps': 979, 'loss/train': 3.942934513092041} +11/06/2021 21:24:49 - INFO - __main__ - Step 981: {'lr': 0.000245, 'samples': 188352, 'steps': 980, 'loss/train': 4.399833679199219} +11/06/2021 21:24:49 - INFO - __main__ - Step 982: {'lr': 0.00024525, 'samples': 188544, 'steps': 981, 'loss/train': 4.462058067321777} +11/06/2021 21:24:50 - INFO - __main__ - Step 983: {'lr': 0.0002455, 'samples': 188736, 'steps': 982, 'loss/train': 4.437088966369629} +11/06/2021 21:24:50 - INFO - __main__ - Step 984: {'lr': 0.00024575, 'samples': 188928, 'steps': 983, 'loss/train': 3.954718828201294} +11/06/2021 21:24:51 - INFO - __main__ - Step 985: {'lr': 0.000246, 'samples': 189120, 'steps': 984, 'loss/train': 3.88590669631958} +11/06/2021 21:24:51 - INFO - __main__ - Step 986: {'lr': 0.00024625, 'samples': 189312, 'steps': 985, 'loss/train': 4.265262603759766} +11/06/2021 21:24:51 - INFO - __main__ - Step 987: {'lr': 0.00024650000000000003, 'samples': 189504, 'steps': 986, 'loss/train': 3.8113763332366943} +11/06/2021 21:24:52 - INFO - __main__ - Step 988: {'lr': 0.00024675, 'samples': 189696, 'steps': 987, 'loss/train': 4.336015701293945} +11/06/2021 21:24:53 - INFO - __main__ - Step 989: {'lr': 0.000247, 'samples': 189888, 'steps': 988, 'loss/train': 3.8807554244995117} +11/06/2021 21:24:53 - INFO - __main__ - Step 990: {'lr': 0.00024725, 'samples': 190080, 'steps': 989, 'loss/train': 3.6231210231781006} +11/06/2021 21:24:53 - INFO - __main__ - Step 991: {'lr': 0.0002475, 'samples': 190272, 'steps': 990, 'loss/train': 4.3600897789001465} +11/06/2021 21:24:54 - INFO - __main__ - Step 992: {'lr': 0.00024775, 'samples': 190464, 'steps': 991, 'loss/train': 4.003350734710693} +11/06/2021 21:24:55 - INFO - __main__ - Step 993: {'lr': 0.000248, 'samples': 190656, 'steps': 992, 'loss/train': 4.158915996551514} +11/06/2021 21:24:55 - INFO - __main__ - Step 994: {'lr': 0.00024825, 'samples': 190848, 'steps': 993, 'loss/train': 4.062311172485352} +11/06/2021 21:24:55 - INFO - __main__ - Step 995: {'lr': 0.0002485, 'samples': 191040, 'steps': 994, 'loss/train': 4.686992645263672} +11/06/2021 21:24:56 - INFO - __main__ - Step 996: {'lr': 0.00024875, 'samples': 191232, 'steps': 995, 'loss/train': 4.652307510375977} +11/06/2021 21:24:57 - INFO - __main__ - Step 997: {'lr': 0.000249, 'samples': 191424, 'steps': 996, 'loss/train': 4.7089762687683105} +11/06/2021 21:24:57 - INFO - __main__ - Step 998: {'lr': 0.00024925, 'samples': 191616, 'steps': 997, 'loss/train': 4.194471836090088} +11/06/2021 21:24:57 - INFO - __main__ - Step 999: {'lr': 0.0002495, 'samples': 191808, 'steps': 998, 'loss/train': 4.319421768188477} +11/06/2021 21:24:58 - INFO - __main__ - Step 1000: {'lr': 0.00024975, 'samples': 192000, 'steps': 999, 'loss/train': 4.688298225402832} +11/06/2021 21:24:58 - INFO - __main__ - Step 1001: {'lr': 0.00025, 'samples': 192192, 'steps': 1000, 'loss/train': 5.178300857543945} +11/06/2021 21:24:58 - INFO - __main__ - Step 1002: {'lr': 0.00025025, 'samples': 192384, 'steps': 1001, 'loss/train': 4.494810104370117} +11/06/2021 21:25:00 - INFO - __main__ - Step 1003: {'lr': 0.0002505, 'samples': 192576, 'steps': 1002, 'loss/train': 4.467245101928711} +11/06/2021 21:25:00 - INFO - __main__ - Step 1004: {'lr': 0.00025075, 'samples': 192768, 'steps': 1003, 'loss/train': 3.843966484069824} +11/06/2021 21:25:00 - INFO - __main__ - Step 1005: {'lr': 0.00025100000000000003, 'samples': 192960, 'steps': 1004, 'loss/train': 3.936264753341675} +11/06/2021 21:25:01 - INFO - __main__ - Step 1006: {'lr': 0.00025124999999999995, 'samples': 193152, 'steps': 1005, 'loss/train': 2.070441961288452} +11/06/2021 21:25:01 - INFO - __main__ - Step 1007: {'lr': 0.0002515, 'samples': 193344, 'steps': 1006, 'loss/train': 2.1154818534851074} +11/06/2021 21:25:01 - INFO - __main__ - Step 1008: {'lr': 0.00025174999999999997, 'samples': 193536, 'steps': 1007, 'loss/train': 4.228350639343262} +11/06/2021 21:25:02 - INFO - __main__ - Step 1009: {'lr': 0.000252, 'samples': 193728, 'steps': 1008, 'loss/train': 3.9860525131225586} +11/06/2021 21:25:03 - INFO - __main__ - Step 1010: {'lr': 0.00025225, 'samples': 193920, 'steps': 1009, 'loss/train': 4.507659912109375} +11/06/2021 21:25:03 - INFO - __main__ - Step 1011: {'lr': 0.0002525, 'samples': 194112, 'steps': 1010, 'loss/train': 4.104220867156982} +11/06/2021 21:25:04 - INFO - __main__ - Step 1012: {'lr': 0.00025275, 'samples': 194304, 'steps': 1011, 'loss/train': 3.661561965942383} +11/06/2021 21:25:04 - INFO - __main__ - Step 1013: {'lr': 0.000253, 'samples': 194496, 'steps': 1012, 'loss/train': 4.302820682525635} +11/06/2021 21:25:05 - INFO - __main__ - Step 1014: {'lr': 0.00025325, 'samples': 194688, 'steps': 1013, 'loss/train': 4.471502780914307} +11/06/2021 21:25:05 - INFO - __main__ - Step 1015: {'lr': 0.0002535, 'samples': 194880, 'steps': 1014, 'loss/train': 4.165027141571045} +11/06/2021 21:25:06 - INFO - __main__ - Step 1016: {'lr': 0.00025374999999999996, 'samples': 195072, 'steps': 1015, 'loss/train': 3.9462151527404785} +11/06/2021 21:25:06 - INFO - __main__ - Step 1017: {'lr': 0.000254, 'samples': 195264, 'steps': 1016, 'loss/train': 6.699620723724365} +11/06/2021 21:25:06 - INFO - __main__ - Step 1018: {'lr': 0.00025425, 'samples': 195456, 'steps': 1017, 'loss/train': 3.6332051753997803} +11/06/2021 21:25:07 - INFO - __main__ - Step 1019: {'lr': 0.0002545, 'samples': 195648, 'steps': 1018, 'loss/train': 4.286611080169678} +11/06/2021 21:25:08 - INFO - __main__ - Step 1020: {'lr': 0.00025475, 'samples': 195840, 'steps': 1019, 'loss/train': 3.8143672943115234} +11/06/2021 21:25:08 - INFO - __main__ - Step 1021: {'lr': 0.000255, 'samples': 196032, 'steps': 1020, 'loss/train': 3.97232723236084} +11/06/2021 21:25:08 - INFO - __main__ - Step 1022: {'lr': 0.00025525, 'samples': 196224, 'steps': 1021, 'loss/train': 4.28098726272583} +11/06/2021 21:25:09 - INFO - __main__ - Step 1023: {'lr': 0.00025550000000000003, 'samples': 196416, 'steps': 1022, 'loss/train': 4.043383598327637} +11/06/2021 21:25:10 - INFO - __main__ - Step 1024: {'lr': 0.00025575, 'samples': 196608, 'steps': 1023, 'loss/train': 4.659992218017578} +11/06/2021 21:25:10 - INFO - __main__ - Step 1025: {'lr': 0.000256, 'samples': 196800, 'steps': 1024, 'loss/train': 4.093658924102783} +11/06/2021 21:25:10 - INFO - __main__ - Step 1026: {'lr': 0.00025624999999999997, 'samples': 196992, 'steps': 1025, 'loss/train': 3.535585880279541} +11/06/2021 21:25:11 - INFO - __main__ - Step 1027: {'lr': 0.0002565, 'samples': 197184, 'steps': 1026, 'loss/train': 4.1824493408203125} +11/06/2021 21:25:11 - INFO - __main__ - Step 1028: {'lr': 0.00025675, 'samples': 197376, 'steps': 1027, 'loss/train': 4.0930609703063965} +11/06/2021 21:25:11 - INFO - __main__ - Step 1029: {'lr': 0.000257, 'samples': 197568, 'steps': 1028, 'loss/train': 3.6540799140930176} +11/06/2021 21:25:13 - INFO - __main__ - Step 1030: {'lr': 0.00025725, 'samples': 197760, 'steps': 1029, 'loss/train': 4.0925822257995605} +11/06/2021 21:25:13 - INFO - __main__ - Step 1031: {'lr': 0.0002575, 'samples': 197952, 'steps': 1030, 'loss/train': 3.85776424407959} +11/06/2021 21:25:13 - INFO - __main__ - Step 1032: {'lr': 0.00025775, 'samples': 198144, 'steps': 1031, 'loss/train': 4.097292423248291} +11/06/2021 21:25:14 - INFO - __main__ - Step 1033: {'lr': 0.00025800000000000004, 'samples': 198336, 'steps': 1032, 'loss/train': 1.9851371049880981} +11/06/2021 21:25:14 - INFO - __main__ - Step 1034: {'lr': 0.00025824999999999996, 'samples': 198528, 'steps': 1033, 'loss/train': 4.119291305541992} +11/06/2021 21:25:15 - INFO - __main__ - Step 1035: {'lr': 0.0002585, 'samples': 198720, 'steps': 1034, 'loss/train': 4.1994733810424805} +11/06/2021 21:25:15 - INFO - __main__ - Step 1036: {'lr': 0.00025875, 'samples': 198912, 'steps': 1035, 'loss/train': 4.295950412750244} +11/06/2021 21:25:16 - INFO - __main__ - Step 1037: {'lr': 0.000259, 'samples': 199104, 'steps': 1036, 'loss/train': 3.5869834423065186} +11/06/2021 21:25:16 - INFO - __main__ - Step 1038: {'lr': 0.00025925, 'samples': 199296, 'steps': 1037, 'loss/train': 5.716175556182861} +11/06/2021 21:25:16 - INFO - __main__ - Step 1039: {'lr': 0.0002595, 'samples': 199488, 'steps': 1038, 'loss/train': 4.104729175567627} +11/06/2021 21:25:18 - INFO - __main__ - Step 1040: {'lr': 0.00025975, 'samples': 199680, 'steps': 1039, 'loss/train': 4.121339321136475} +11/06/2021 21:25:18 - INFO - __main__ - Step 1041: {'lr': 0.00026000000000000003, 'samples': 199872, 'steps': 1040, 'loss/train': 4.044469356536865} +11/06/2021 21:25:18 - INFO - __main__ - Step 1042: {'lr': 0.00026025, 'samples': 200064, 'steps': 1041, 'loss/train': 4.489924430847168} +11/06/2021 21:25:19 - INFO - __main__ - Step 1043: {'lr': 0.0002605, 'samples': 200256, 'steps': 1042, 'loss/train': 4.626270771026611} +11/06/2021 21:25:19 - INFO - __main__ - Step 1044: {'lr': 0.00026074999999999997, 'samples': 200448, 'steps': 1043, 'loss/train': 3.788095712661743} +11/06/2021 21:25:20 - INFO - __main__ - Step 1045: {'lr': 0.000261, 'samples': 200640, 'steps': 1044, 'loss/train': 4.697029113769531} +11/06/2021 21:25:20 - INFO - __main__ - Step 1046: {'lr': 0.00026125, 'samples': 200832, 'steps': 1045, 'loss/train': 3.7859976291656494} +11/06/2021 21:25:21 - INFO - __main__ - Step 1047: {'lr': 0.0002615, 'samples': 201024, 'steps': 1046, 'loss/train': 4.636324405670166} +11/06/2021 21:25:21 - INFO - __main__ - Step 1048: {'lr': 0.00026175, 'samples': 201216, 'steps': 1047, 'loss/train': 4.295483112335205} +11/06/2021 21:25:21 - INFO - __main__ - Step 1049: {'lr': 0.000262, 'samples': 201408, 'steps': 1048, 'loss/train': 3.938405990600586} +11/06/2021 21:25:22 - INFO - __main__ - Step 1050: {'lr': 0.00026225, 'samples': 201600, 'steps': 1049, 'loss/train': 5.09901762008667} +11/06/2021 21:25:23 - INFO - __main__ - Step 1051: {'lr': 0.00026250000000000004, 'samples': 201792, 'steps': 1050, 'loss/train': 4.2966108322143555} +11/06/2021 21:25:23 - INFO - __main__ - Step 1052: {'lr': 0.00026274999999999996, 'samples': 201984, 'steps': 1051, 'loss/train': 3.858107805252075} +11/06/2021 21:25:23 - INFO - __main__ - Step 1053: {'lr': 0.000263, 'samples': 202176, 'steps': 1052, 'loss/train': 4.3338303565979} +11/06/2021 21:25:24 - INFO - __main__ - Step 1054: {'lr': 0.00026325, 'samples': 202368, 'steps': 1053, 'loss/train': 4.086007118225098} +11/06/2021 21:25:25 - INFO - __main__ - Step 1055: {'lr': 0.0002635, 'samples': 202560, 'steps': 1054, 'loss/train': 3.4907381534576416} +11/06/2021 21:25:25 - INFO - __main__ - Step 1056: {'lr': 0.00026375, 'samples': 202752, 'steps': 1055, 'loss/train': 6.328280925750732} +11/06/2021 21:25:26 - INFO - __main__ - Step 1057: {'lr': 0.000264, 'samples': 202944, 'steps': 1056, 'loss/train': 4.75831413269043} +11/06/2021 21:25:26 - INFO - __main__ - Step 1058: {'lr': 0.00026425, 'samples': 203136, 'steps': 1057, 'loss/train': 4.140725135803223} +11/06/2021 21:25:26 - INFO - __main__ - Step 1059: {'lr': 0.00026450000000000003, 'samples': 203328, 'steps': 1058, 'loss/train': 4.232659339904785} +11/06/2021 21:25:27 - INFO - __main__ - Step 1060: {'lr': 0.00026475, 'samples': 203520, 'steps': 1059, 'loss/train': 3.662130117416382} +11/06/2021 21:25:28 - INFO - __main__ - Step 1061: {'lr': 0.00026500000000000004, 'samples': 203712, 'steps': 1060, 'loss/train': 4.175182819366455} +11/06/2021 21:25:28 - INFO - __main__ - Step 1062: {'lr': 0.00026524999999999997, 'samples': 203904, 'steps': 1061, 'loss/train': 4.066892623901367} +11/06/2021 21:25:28 - INFO - __main__ - Step 1063: {'lr': 0.0002655, 'samples': 204096, 'steps': 1062, 'loss/train': 3.988063335418701} +11/06/2021 21:25:29 - INFO - __main__ - Step 1064: {'lr': 0.00026575, 'samples': 204288, 'steps': 1063, 'loss/train': 5.1581830978393555} +11/06/2021 21:25:29 - INFO - __main__ - Step 1065: {'lr': 0.000266, 'samples': 204480, 'steps': 1064, 'loss/train': 3.77549409866333} +11/06/2021 21:25:30 - INFO - __main__ - Step 1066: {'lr': 0.00026625, 'samples': 204672, 'steps': 1065, 'loss/train': 3.962754011154175} +11/06/2021 21:25:30 - INFO - __main__ - Step 1067: {'lr': 0.0002665, 'samples': 204864, 'steps': 1066, 'loss/train': 4.140915393829346} +11/06/2021 21:25:31 - INFO - __main__ - Step 1068: {'lr': 0.00026675, 'samples': 205056, 'steps': 1067, 'loss/train': 3.9314892292022705} +11/06/2021 21:25:31 - INFO - __main__ - Step 1069: {'lr': 0.00026700000000000004, 'samples': 205248, 'steps': 1068, 'loss/train': 4.5690155029296875} +11/06/2021 21:25:31 - INFO - __main__ - Step 1070: {'lr': 0.00026725, 'samples': 205440, 'steps': 1069, 'loss/train': 2.362624168395996} +11/06/2021 21:25:33 - INFO - __main__ - Step 1071: {'lr': 0.0002675, 'samples': 205632, 'steps': 1070, 'loss/train': 3.6357979774475098} +11/06/2021 21:25:33 - INFO - __main__ - Step 1072: {'lr': 0.00026775, 'samples': 205824, 'steps': 1071, 'loss/train': 4.618821144104004} +11/06/2021 21:25:33 - INFO - __main__ - Step 1073: {'lr': 0.000268, 'samples': 206016, 'steps': 1072, 'loss/train': 3.773068904876709} +11/06/2021 21:25:34 - INFO - __main__ - Step 1074: {'lr': 0.00026825, 'samples': 206208, 'steps': 1073, 'loss/train': 3.240086078643799} +11/06/2021 21:25:34 - INFO - __main__ - Step 1075: {'lr': 0.0002685, 'samples': 206400, 'steps': 1074, 'loss/train': 5.478127479553223} +11/06/2021 21:25:35 - INFO - __main__ - Step 1076: {'lr': 0.00026875, 'samples': 206592, 'steps': 1075, 'loss/train': 4.112662315368652} +11/06/2021 21:25:35 - INFO - __main__ - Step 1077: {'lr': 0.00026900000000000003, 'samples': 206784, 'steps': 1076, 'loss/train': 4.273911476135254} +11/06/2021 21:25:36 - INFO - __main__ - Step 1078: {'lr': 0.00026925, 'samples': 206976, 'steps': 1077, 'loss/train': 4.561737060546875} +11/06/2021 21:25:36 - INFO - __main__ - Step 1079: {'lr': 0.00026950000000000005, 'samples': 207168, 'steps': 1078, 'loss/train': 4.370131015777588} +11/06/2021 21:25:36 - INFO - __main__ - Step 1080: {'lr': 0.00026974999999999997, 'samples': 207360, 'steps': 1079, 'loss/train': 4.151457786560059} +11/06/2021 21:25:37 - INFO - __main__ - Step 1081: {'lr': 0.00027, 'samples': 207552, 'steps': 1080, 'loss/train': 4.187550067901611} +11/06/2021 21:25:38 - INFO - __main__ - Step 1082: {'lr': 0.00027025, 'samples': 207744, 'steps': 1081, 'loss/train': 3.7700130939483643} +11/06/2021 21:25:38 - INFO - __main__ - Step 1083: {'lr': 0.0002705, 'samples': 207936, 'steps': 1082, 'loss/train': 3.5349581241607666} +11/06/2021 21:25:38 - INFO - __main__ - Step 1084: {'lr': 0.00027075, 'samples': 208128, 'steps': 1083, 'loss/train': 3.959185838699341} +11/06/2021 21:25:39 - INFO - __main__ - Step 1085: {'lr': 0.00027100000000000003, 'samples': 208320, 'steps': 1084, 'loss/train': 4.234473705291748} +11/06/2021 21:25:40 - INFO - __main__ - Step 1086: {'lr': 0.00027125, 'samples': 208512, 'steps': 1085, 'loss/train': 4.3777313232421875} +11/06/2021 21:25:40 - INFO - __main__ - Step 1087: {'lr': 0.00027150000000000004, 'samples': 208704, 'steps': 1086, 'loss/train': 4.0575103759765625} +11/06/2021 21:25:41 - INFO - __main__ - Step 1088: {'lr': 0.00027175, 'samples': 208896, 'steps': 1087, 'loss/train': 3.6606838703155518} +11/06/2021 21:25:41 - INFO - __main__ - Step 1089: {'lr': 0.00027200000000000005, 'samples': 209088, 'steps': 1088, 'loss/train': 4.134492874145508} +11/06/2021 21:25:41 - INFO - __main__ - Step 1090: {'lr': 0.00027225, 'samples': 209280, 'steps': 1089, 'loss/train': 3.7823238372802734} +11/06/2021 21:25:42 - INFO - __main__ - Step 1091: {'lr': 0.0002725, 'samples': 209472, 'steps': 1090, 'loss/train': 3.5656397342681885} +11/06/2021 21:25:43 - INFO - __main__ - Step 1092: {'lr': 0.00027275, 'samples': 209664, 'steps': 1091, 'loss/train': 4.612241744995117} +11/06/2021 21:25:43 - INFO - __main__ - Step 1093: {'lr': 0.000273, 'samples': 209856, 'steps': 1092, 'loss/train': 4.211349010467529} +11/06/2021 21:25:43 - INFO - __main__ - Step 1094: {'lr': 0.00027325, 'samples': 210048, 'steps': 1093, 'loss/train': 3.8772196769714355} +11/06/2021 21:25:44 - INFO - __main__ - Step 1095: {'lr': 0.00027350000000000003, 'samples': 210240, 'steps': 1094, 'loss/train': 4.242520332336426} +11/06/2021 21:25:45 - INFO - __main__ - Step 1096: {'lr': 0.00027375, 'samples': 210432, 'steps': 1095, 'loss/train': 4.067473411560059} +11/06/2021 21:25:45 - INFO - __main__ - Step 1097: {'lr': 0.00027400000000000005, 'samples': 210624, 'steps': 1096, 'loss/train': 4.022539138793945} +11/06/2021 21:25:46 - INFO - __main__ - Step 1098: {'lr': 0.00027425, 'samples': 210816, 'steps': 1097, 'loss/train': 3.810528516769409} +11/06/2021 21:25:46 - INFO - __main__ - Step 1099: {'lr': 0.0002745, 'samples': 211008, 'steps': 1098, 'loss/train': 4.089423179626465} +11/06/2021 21:25:47 - INFO - __main__ - Step 1100: {'lr': 0.00027475, 'samples': 211200, 'steps': 1099, 'loss/train': 4.257665157318115} +11/06/2021 21:25:48 - INFO - __main__ - Step 1101: {'lr': 0.000275, 'samples': 211392, 'steps': 1100, 'loss/train': 4.2323384284973145} +11/06/2021 21:25:48 - INFO - __main__ - Step 1102: {'lr': 0.00027525, 'samples': 211584, 'steps': 1101, 'loss/train': 4.789181709289551} +11/06/2021 21:25:48 - INFO - __main__ - Step 1103: {'lr': 0.00027550000000000003, 'samples': 211776, 'steps': 1102, 'loss/train': 6.588270664215088} +11/06/2021 21:25:49 - INFO - __main__ - Step 1104: {'lr': 0.00027575, 'samples': 211968, 'steps': 1103, 'loss/train': 3.7694168090820312} +11/06/2021 21:25:49 - INFO - __main__ - Step 1105: {'lr': 0.00027600000000000004, 'samples': 212160, 'steps': 1104, 'loss/train': 3.7395424842834473} +11/06/2021 21:25:50 - INFO - __main__ - Step 1106: {'lr': 0.00027625, 'samples': 212352, 'steps': 1105, 'loss/train': 4.408657073974609} +11/06/2021 21:25:51 - INFO - __main__ - Step 1107: {'lr': 0.00027650000000000005, 'samples': 212544, 'steps': 1106, 'loss/train': 4.209283828735352} +11/06/2021 21:25:51 - INFO - __main__ - Step 1108: {'lr': 0.00027675, 'samples': 212736, 'steps': 1107, 'loss/train': 4.449584007263184} +11/06/2021 21:25:51 - INFO - __main__ - Step 1109: {'lr': 0.000277, 'samples': 212928, 'steps': 1108, 'loss/train': 3.7549164295196533} +11/06/2021 21:25:52 - INFO - __main__ - Step 1110: {'lr': 0.00027725, 'samples': 213120, 'steps': 1109, 'loss/train': 4.272808074951172} +11/06/2021 21:25:52 - INFO - __main__ - Step 1111: {'lr': 0.0002775, 'samples': 213312, 'steps': 1110, 'loss/train': 4.251165390014648} +11/06/2021 21:25:53 - INFO - __main__ - Step 1112: {'lr': 0.00027775, 'samples': 213504, 'steps': 1111, 'loss/train': 4.609951972961426} +11/06/2021 21:25:54 - INFO - __main__ - Step 1113: {'lr': 0.00027800000000000004, 'samples': 213696, 'steps': 1112, 'loss/train': 4.141632556915283} +11/06/2021 21:25:54 - INFO - __main__ - Step 1114: {'lr': 0.00027825, 'samples': 213888, 'steps': 1113, 'loss/train': 4.153262615203857} +11/06/2021 21:25:54 - INFO - __main__ - Step 1115: {'lr': 0.00027850000000000005, 'samples': 214080, 'steps': 1114, 'loss/train': 3.717008113861084} +11/06/2021 21:25:55 - INFO - __main__ - Step 1116: {'lr': 0.00027875, 'samples': 214272, 'steps': 1115, 'loss/train': 3.0349667072296143} +11/06/2021 21:25:56 - INFO - __main__ - Step 1117: {'lr': 0.000279, 'samples': 214464, 'steps': 1116, 'loss/train': 5.148609161376953} +11/06/2021 21:25:56 - INFO - __main__ - Step 1118: {'lr': 0.00027925, 'samples': 214656, 'steps': 1117, 'loss/train': 4.0414958000183105} +11/06/2021 21:25:56 - INFO - __main__ - Step 1119: {'lr': 0.0002795, 'samples': 214848, 'steps': 1118, 'loss/train': 3.6977531909942627} +11/06/2021 21:25:57 - INFO - __main__ - Step 1120: {'lr': 0.00027975, 'samples': 215040, 'steps': 1119, 'loss/train': 3.3791584968566895} +11/06/2021 21:25:57 - INFO - __main__ - Step 1121: {'lr': 0.00028000000000000003, 'samples': 215232, 'steps': 1120, 'loss/train': 3.486509084701538} +11/06/2021 21:25:57 - INFO - __main__ - Step 1122: {'lr': 0.00028025, 'samples': 215424, 'steps': 1121, 'loss/train': 4.281680583953857} +11/06/2021 21:25:59 - INFO - __main__ - Step 1123: {'lr': 0.00028050000000000004, 'samples': 215616, 'steps': 1122, 'loss/train': 5.040244102478027} +11/06/2021 21:25:59 - INFO - __main__ - Step 1124: {'lr': 0.00028075, 'samples': 215808, 'steps': 1123, 'loss/train': 3.963624954223633} +11/06/2021 21:25:59 - INFO - __main__ - Step 1125: {'lr': 0.00028100000000000005, 'samples': 216000, 'steps': 1124, 'loss/train': 3.8375720977783203} +11/06/2021 21:26:00 - INFO - __main__ - Step 1126: {'lr': 0.00028125000000000003, 'samples': 216192, 'steps': 1125, 'loss/train': 4.240171432495117} +11/06/2021 21:26:00 - INFO - __main__ - Step 1127: {'lr': 0.00028149999999999996, 'samples': 216384, 'steps': 1126, 'loss/train': 3.637873888015747} +11/06/2021 21:26:01 - INFO - __main__ - Step 1128: {'lr': 0.00028175, 'samples': 216576, 'steps': 1127, 'loss/train': 3.8652379512786865} +11/06/2021 21:26:01 - INFO - __main__ - Step 1129: {'lr': 0.00028199999999999997, 'samples': 216768, 'steps': 1128, 'loss/train': 4.120966911315918} +11/06/2021 21:26:02 - INFO - __main__ - Step 1130: {'lr': 0.00028225, 'samples': 216960, 'steps': 1129, 'loss/train': 4.294138431549072} +11/06/2021 21:26:02 - INFO - __main__ - Step 1131: {'lr': 0.0002825, 'samples': 217152, 'steps': 1130, 'loss/train': 3.7788121700286865} +11/06/2021 21:26:02 - INFO - __main__ - Step 1132: {'lr': 0.00028275, 'samples': 217344, 'steps': 1131, 'loss/train': 3.901336908340454} +11/06/2021 21:26:03 - INFO - __main__ - Step 1133: {'lr': 0.000283, 'samples': 217536, 'steps': 1132, 'loss/train': 4.027707099914551} +11/06/2021 21:26:04 - INFO - __main__ - Step 1134: {'lr': 0.00028325000000000003, 'samples': 217728, 'steps': 1133, 'loss/train': 4.218957424163818} +11/06/2021 21:26:04 - INFO - __main__ - Step 1135: {'lr': 0.0002835, 'samples': 217920, 'steps': 1134, 'loss/train': 4.311142444610596} +11/06/2021 21:26:05 - INFO - __main__ - Step 1136: {'lr': 0.00028375, 'samples': 218112, 'steps': 1135, 'loss/train': 4.181615352630615} +11/06/2021 21:26:05 - INFO - __main__ - Step 1137: {'lr': 0.00028399999999999996, 'samples': 218304, 'steps': 1136, 'loss/train': 3.916645050048828} +11/06/2021 21:26:06 - INFO - __main__ - Step 1138: {'lr': 0.00028425, 'samples': 218496, 'steps': 1137, 'loss/train': 4.085984706878662} +11/06/2021 21:26:06 - INFO - __main__ - Step 1139: {'lr': 0.0002845, 'samples': 218688, 'steps': 1138, 'loss/train': 4.673676013946533} +11/06/2021 21:26:07 - INFO - __main__ - Step 1140: {'lr': 0.00028475, 'samples': 218880, 'steps': 1139, 'loss/train': 4.280994415283203} +11/06/2021 21:26:07 - INFO - __main__ - Step 1141: {'lr': 0.000285, 'samples': 219072, 'steps': 1140, 'loss/train': 4.047427177429199} +11/06/2021 21:26:07 - INFO - __main__ - Step 1142: {'lr': 0.00028525, 'samples': 219264, 'steps': 1141, 'loss/train': 3.885024070739746} +11/06/2021 21:26:08 - INFO - __main__ - Step 1143: {'lr': 0.0002855, 'samples': 219456, 'steps': 1142, 'loss/train': 4.40393590927124} +11/06/2021 21:26:09 - INFO - __main__ - Step 1144: {'lr': 0.00028575000000000003, 'samples': 219648, 'steps': 1143, 'loss/train': 4.992481708526611} +11/06/2021 21:26:09 - INFO - __main__ - Step 1145: {'lr': 0.00028599999999999996, 'samples': 219840, 'steps': 1144, 'loss/train': 4.026183128356934} +11/06/2021 21:26:10 - INFO - __main__ - Step 1146: {'lr': 0.00028625, 'samples': 220032, 'steps': 1145, 'loss/train': 3.5987935066223145} +11/06/2021 21:26:10 - INFO - __main__ - Step 1147: {'lr': 0.00028649999999999997, 'samples': 220224, 'steps': 1146, 'loss/train': 4.403866767883301} +11/06/2021 21:26:11 - INFO - __main__ - Step 1148: {'lr': 0.00028675, 'samples': 220416, 'steps': 1147, 'loss/train': 3.9268059730529785} +11/06/2021 21:26:11 - INFO - __main__ - Step 1149: {'lr': 0.000287, 'samples': 220608, 'steps': 1148, 'loss/train': 3.6902759075164795} +11/06/2021 21:26:12 - INFO - __main__ - Step 1150: {'lr': 0.00028725, 'samples': 220800, 'steps': 1149, 'loss/train': 4.134997367858887} +11/06/2021 21:26:12 - INFO - __main__ - Step 1151: {'lr': 0.0002875, 'samples': 220992, 'steps': 1150, 'loss/train': 3.9367594718933105} +11/06/2021 21:26:12 - INFO - __main__ - Step 1152: {'lr': 0.00028775000000000003, 'samples': 221184, 'steps': 1151, 'loss/train': 3.4053988456726074} +11/06/2021 21:26:13 - INFO - __main__ - Step 1153: {'lr': 0.000288, 'samples': 221376, 'steps': 1152, 'loss/train': 4.11300802230835} +11/06/2021 21:26:14 - INFO - __main__ - Step 1154: {'lr': 0.00028825, 'samples': 221568, 'steps': 1153, 'loss/train': 3.790684700012207} +11/06/2021 21:26:14 - INFO - __main__ - Step 1155: {'lr': 0.00028849999999999997, 'samples': 221760, 'steps': 1154, 'loss/train': 4.096200942993164} +11/06/2021 21:26:14 - INFO - __main__ - Step 1156: {'lr': 0.00028875, 'samples': 221952, 'steps': 1155, 'loss/train': 4.3799262046813965} +11/06/2021 21:26:15 - INFO - __main__ - Step 1157: {'lr': 0.000289, 'samples': 222144, 'steps': 1156, 'loss/train': 4.1134748458862305} +11/06/2021 21:26:15 - INFO - __main__ - Step 1158: {'lr': 0.00028925, 'samples': 222336, 'steps': 1157, 'loss/train': 4.462249755859375} +11/06/2021 21:26:16 - INFO - __main__ - Step 1159: {'lr': 0.0002895, 'samples': 222528, 'steps': 1158, 'loss/train': 2.7520174980163574} +11/06/2021 21:26:16 - INFO - __main__ - Step 1160: {'lr': 0.00028975, 'samples': 222720, 'steps': 1159, 'loss/train': 4.172967910766602} +11/06/2021 21:26:17 - INFO - __main__ - Step 1161: {'lr': 0.00029, 'samples': 222912, 'steps': 1160, 'loss/train': 3.451906204223633} +11/06/2021 21:26:17 - INFO - __main__ - Step 1162: {'lr': 0.00029025000000000003, 'samples': 223104, 'steps': 1161, 'loss/train': 4.355815887451172} +11/06/2021 21:26:18 - INFO - __main__ - Step 1163: {'lr': 0.00029049999999999996, 'samples': 223296, 'steps': 1162, 'loss/train': 4.1517109870910645} +11/06/2021 21:26:19 - INFO - __main__ - Step 1164: {'lr': 0.00029075, 'samples': 223488, 'steps': 1163, 'loss/train': 4.004212856292725} +11/06/2021 21:26:19 - INFO - __main__ - Step 1165: {'lr': 0.00029099999999999997, 'samples': 223680, 'steps': 1164, 'loss/train': 4.073708534240723} +11/06/2021 21:26:19 - INFO - __main__ - Step 1166: {'lr': 0.00029125, 'samples': 223872, 'steps': 1165, 'loss/train': 4.045283317565918} +11/06/2021 21:26:20 - INFO - __main__ - Step 1167: {'lr': 0.0002915, 'samples': 224064, 'steps': 1166, 'loss/train': 3.959521770477295} +11/06/2021 21:26:20 - INFO - __main__ - Step 1168: {'lr': 0.00029175, 'samples': 224256, 'steps': 1167, 'loss/train': 3.8172402381896973} +11/06/2021 21:26:21 - INFO - __main__ - Step 1169: {'lr': 0.000292, 'samples': 224448, 'steps': 1168, 'loss/train': 3.809446096420288} +11/06/2021 21:26:21 - INFO - __main__ - Step 1170: {'lr': 0.00029225000000000003, 'samples': 224640, 'steps': 1169, 'loss/train': 4.352285385131836} +11/06/2021 21:26:22 - INFO - __main__ - Step 1171: {'lr': 0.0002925, 'samples': 224832, 'steps': 1170, 'loss/train': 3.0493404865264893} +11/06/2021 21:26:22 - INFO - __main__ - Step 1172: {'lr': 0.00029275000000000004, 'samples': 225024, 'steps': 1171, 'loss/train': 4.092573642730713} +11/06/2021 21:26:22 - INFO - __main__ - Step 1173: {'lr': 0.00029299999999999997, 'samples': 225216, 'steps': 1172, 'loss/train': 4.186103820800781} +11/06/2021 21:26:23 - INFO - __main__ - Step 1174: {'lr': 0.00029325, 'samples': 225408, 'steps': 1173, 'loss/train': 3.786396026611328} +11/06/2021 21:26:24 - INFO - __main__ - Step 1175: {'lr': 0.0002935, 'samples': 225600, 'steps': 1174, 'loss/train': 4.53329610824585} +11/06/2021 21:26:24 - INFO - __main__ - Step 1176: {'lr': 0.00029375, 'samples': 225792, 'steps': 1175, 'loss/train': 3.6532394886016846} +11/06/2021 21:26:24 - INFO - __main__ - Step 1177: {'lr': 0.000294, 'samples': 225984, 'steps': 1176, 'loss/train': 3.6320600509643555} +11/06/2021 21:26:25 - INFO - __main__ - Step 1178: {'lr': 0.00029425, 'samples': 226176, 'steps': 1177, 'loss/train': 3.9214487075805664} +11/06/2021 21:26:26 - INFO - __main__ - Step 1179: {'lr': 0.0002945, 'samples': 226368, 'steps': 1178, 'loss/train': 3.6811251640319824} +11/06/2021 21:26:26 - INFO - __main__ - Step 1180: {'lr': 0.00029475000000000004, 'samples': 226560, 'steps': 1179, 'loss/train': 3.892512559890747} +11/06/2021 21:26:27 - INFO - __main__ - Step 1181: {'lr': 0.000295, 'samples': 226752, 'steps': 1180, 'loss/train': 4.335596561431885} +11/06/2021 21:26:27 - INFO - __main__ - Step 1182: {'lr': 0.00029525, 'samples': 226944, 'steps': 1181, 'loss/train': 3.9504594802856445} +11/06/2021 21:26:27 - INFO - __main__ - Step 1183: {'lr': 0.00029549999999999997, 'samples': 227136, 'steps': 1182, 'loss/train': 4.172230243682861} +11/06/2021 21:26:28 - INFO - __main__ - Step 1184: {'lr': 0.00029575, 'samples': 227328, 'steps': 1183, 'loss/train': 4.093757152557373} +11/06/2021 21:26:29 - INFO - __main__ - Step 1185: {'lr': 0.000296, 'samples': 227520, 'steps': 1184, 'loss/train': 3.9272379875183105} +11/06/2021 21:26:29 - INFO - __main__ - Step 1186: {'lr': 0.00029625, 'samples': 227712, 'steps': 1185, 'loss/train': 3.678920269012451} +11/06/2021 21:26:29 - INFO - __main__ - Step 1187: {'lr': 0.0002965, 'samples': 227904, 'steps': 1186, 'loss/train': 3.9552578926086426} +11/06/2021 21:26:30 - INFO - __main__ - Step 1188: {'lr': 0.00029675000000000003, 'samples': 228096, 'steps': 1187, 'loss/train': 3.7164466381073} +11/06/2021 21:26:30 - INFO - __main__ - Step 1189: {'lr': 0.000297, 'samples': 228288, 'steps': 1188, 'loss/train': 4.196506977081299} +11/06/2021 21:26:31 - INFO - __main__ - Step 1190: {'lr': 0.00029725000000000004, 'samples': 228480, 'steps': 1189, 'loss/train': 3.887439489364624} +11/06/2021 21:26:31 - INFO - __main__ - Step 1191: {'lr': 0.00029749999999999997, 'samples': 228672, 'steps': 1190, 'loss/train': 3.7323334217071533} +11/06/2021 21:26:32 - INFO - __main__ - Step 1192: {'lr': 0.00029775, 'samples': 228864, 'steps': 1191, 'loss/train': 4.008239269256592} +11/06/2021 21:26:32 - INFO - __main__ - Step 1193: {'lr': 0.000298, 'samples': 229056, 'steps': 1192, 'loss/train': 5.458200454711914} +11/06/2021 21:26:33 - INFO - __main__ - Step 1194: {'lr': 0.00029825, 'samples': 229248, 'steps': 1193, 'loss/train': 3.7591049671173096} +11/06/2021 21:26:34 - INFO - __main__ - Step 1195: {'lr': 0.0002985, 'samples': 229440, 'steps': 1194, 'loss/train': 4.328658103942871} +11/06/2021 21:26:34 - INFO - __main__ - Step 1196: {'lr': 0.00029875, 'samples': 229632, 'steps': 1195, 'loss/train': 3.8931264877319336} +11/06/2021 21:26:34 - INFO - __main__ - Step 1197: {'lr': 0.000299, 'samples': 229824, 'steps': 1196, 'loss/train': 4.966779708862305} +11/06/2021 21:26:35 - INFO - __main__ - Step 1198: {'lr': 0.00029925000000000004, 'samples': 230016, 'steps': 1197, 'loss/train': 3.1090831756591797} +11/06/2021 21:26:35 - INFO - __main__ - Step 1199: {'lr': 0.0002995, 'samples': 230208, 'steps': 1198, 'loss/train': 3.9816088676452637} +11/06/2021 21:26:36 - INFO - __main__ - Step 1200: {'lr': 0.00029975000000000005, 'samples': 230400, 'steps': 1199, 'loss/train': 4.041784286499023} +11/06/2021 21:26:36 - INFO - __main__ - Step 1201: {'lr': 0.0003, 'samples': 230592, 'steps': 1200, 'loss/train': 3.73962664604187} +11/06/2021 21:26:37 - INFO - __main__ - Step 1202: {'lr': 0.00030025, 'samples': 230784, 'steps': 1201, 'loss/train': 3.259591579437256} +11/06/2021 21:26:37 - INFO - __main__ - Step 1203: {'lr': 0.0003005, 'samples': 230976, 'steps': 1202, 'loss/train': 4.60701322555542} +11/06/2021 21:26:37 - INFO - __main__ - Step 1204: {'lr': 0.00030075, 'samples': 231168, 'steps': 1203, 'loss/train': 4.123647689819336} +11/06/2021 21:26:39 - INFO - __main__ - Step 1205: {'lr': 0.000301, 'samples': 231360, 'steps': 1204, 'loss/train': 4.385739326477051} +11/06/2021 21:26:39 - INFO - __main__ - Step 1206: {'lr': 0.00030125000000000003, 'samples': 231552, 'steps': 1205, 'loss/train': 3.796212911605835} +11/06/2021 21:26:39 - INFO - __main__ - Step 1207: {'lr': 0.0003015, 'samples': 231744, 'steps': 1206, 'loss/train': 4.638833999633789} +11/06/2021 21:26:40 - INFO - __main__ - Step 1208: {'lr': 0.00030175000000000004, 'samples': 231936, 'steps': 1207, 'loss/train': 4.022327423095703} +11/06/2021 21:26:40 - INFO - __main__ - Step 1209: {'lr': 0.000302, 'samples': 232128, 'steps': 1208, 'loss/train': 4.19215202331543} +11/06/2021 21:26:41 - INFO - __main__ - Step 1210: {'lr': 0.00030225, 'samples': 232320, 'steps': 1209, 'loss/train': 4.021753787994385} +11/06/2021 21:26:41 - INFO - __main__ - Step 1211: {'lr': 0.0003025, 'samples': 232512, 'steps': 1210, 'loss/train': 3.7708232402801514} +11/06/2021 21:26:42 - INFO - __main__ - Step 1212: {'lr': 0.00030275, 'samples': 232704, 'steps': 1211, 'loss/train': 3.500831365585327} +11/06/2021 21:26:42 - INFO - __main__ - Step 1213: {'lr': 0.000303, 'samples': 232896, 'steps': 1212, 'loss/train': 3.7347517013549805} +11/06/2021 21:26:42 - INFO - __main__ - Step 1214: {'lr': 0.00030325, 'samples': 233088, 'steps': 1213, 'loss/train': 3.712738275527954} +11/06/2021 21:26:43 - INFO - __main__ - Step 1215: {'lr': 0.0003035, 'samples': 233280, 'steps': 1214, 'loss/train': 4.544304370880127} +11/06/2021 21:26:44 - INFO - __main__ - Step 1216: {'lr': 0.00030375000000000004, 'samples': 233472, 'steps': 1215, 'loss/train': 3.8694875240325928} +11/06/2021 21:26:44 - INFO - __main__ - Step 1217: {'lr': 0.000304, 'samples': 233664, 'steps': 1216, 'loss/train': 3.3171164989471436} +11/06/2021 21:26:44 - INFO - __main__ - Step 1218: {'lr': 0.00030425000000000005, 'samples': 233856, 'steps': 1217, 'loss/train': 3.7530202865600586} +11/06/2021 21:26:45 - INFO - __main__ - Step 1219: {'lr': 0.0003045, 'samples': 234048, 'steps': 1218, 'loss/train': 3.967923879623413} +11/06/2021 21:26:45 - INFO - __main__ - Step 1220: {'lr': 0.00030475, 'samples': 234240, 'steps': 1219, 'loss/train': 3.715089797973633} +11/06/2021 21:26:46 - INFO - __main__ - Step 1221: {'lr': 0.000305, 'samples': 234432, 'steps': 1220, 'loss/train': 3.693310260772705} +11/06/2021 21:26:46 - INFO - __main__ - Step 1222: {'lr': 0.00030525, 'samples': 234624, 'steps': 1221, 'loss/train': 3.5755531787872314} +11/06/2021 21:26:47 - INFO - __main__ - Step 1223: {'lr': 0.0003055, 'samples': 234816, 'steps': 1222, 'loss/train': 4.144630432128906} +11/06/2021 21:26:47 - INFO - __main__ - Step 1224: {'lr': 0.00030575000000000003, 'samples': 235008, 'steps': 1223, 'loss/train': 3.8937008380889893} +11/06/2021 21:26:48 - INFO - __main__ - Step 1225: {'lr': 0.000306, 'samples': 235200, 'steps': 1224, 'loss/train': 3.7765586376190186} +11/06/2021 21:26:48 - INFO - __main__ - Step 1226: {'lr': 0.00030625000000000004, 'samples': 235392, 'steps': 1225, 'loss/train': 4.3001017570495605} +11/06/2021 21:26:49 - INFO - __main__ - Step 1227: {'lr': 0.0003065, 'samples': 235584, 'steps': 1226, 'loss/train': 3.861295461654663} +11/06/2021 21:26:49 - INFO - __main__ - Step 1228: {'lr': 0.00030675, 'samples': 235776, 'steps': 1227, 'loss/train': 4.244755268096924} +11/06/2021 21:26:50 - INFO - __main__ - Step 1229: {'lr': 0.000307, 'samples': 235968, 'steps': 1228, 'loss/train': 4.392697811126709} +11/06/2021 21:26:50 - INFO - __main__ - Step 1230: {'lr': 0.00030725, 'samples': 236160, 'steps': 1229, 'loss/train': 4.003592014312744} +11/06/2021 21:26:51 - INFO - __main__ - Step 1231: {'lr': 0.0003075, 'samples': 236352, 'steps': 1230, 'loss/train': 3.7558765411376953} +11/06/2021 21:26:51 - INFO - __main__ - Step 1232: {'lr': 0.00030775, 'samples': 236544, 'steps': 1231, 'loss/train': 3.535252571105957} +11/06/2021 21:26:52 - INFO - __main__ - Step 1233: {'lr': 0.000308, 'samples': 236736, 'steps': 1232, 'loss/train': 3.4438316822052} +11/06/2021 21:26:52 - INFO - __main__ - Step 1234: {'lr': 0.00030825000000000004, 'samples': 236928, 'steps': 1233, 'loss/train': 3.6062018871307373} +11/06/2021 21:26:52 - INFO - __main__ - Step 1235: {'lr': 0.0003085, 'samples': 237120, 'steps': 1234, 'loss/train': 3.9174911975860596} +11/06/2021 21:26:53 - INFO - __main__ - Step 1236: {'lr': 0.00030875000000000005, 'samples': 237312, 'steps': 1235, 'loss/train': 3.6126482486724854} +11/06/2021 21:26:54 - INFO - __main__ - Step 1237: {'lr': 0.00030900000000000003, 'samples': 237504, 'steps': 1236, 'loss/train': 3.4603700637817383} +11/06/2021 21:26:54 - INFO - __main__ - Step 1238: {'lr': 0.00030925, 'samples': 237696, 'steps': 1237, 'loss/train': 5.033356666564941} +11/06/2021 21:26:54 - INFO - __main__ - Step 1239: {'lr': 0.0003095, 'samples': 237888, 'steps': 1238, 'loss/train': 3.9721944332122803} +11/06/2021 21:26:55 - INFO - __main__ - Step 1240: {'lr': 0.00030975, 'samples': 238080, 'steps': 1239, 'loss/train': 3.999577045440674} +11/06/2021 21:26:56 - INFO - __main__ - Step 1241: {'lr': 0.00031, 'samples': 238272, 'steps': 1240, 'loss/train': 3.221419334411621} +11/06/2021 21:26:56 - INFO - __main__ - Step 1242: {'lr': 0.00031025000000000003, 'samples': 238464, 'steps': 1241, 'loss/train': 3.553842067718506} +11/06/2021 21:26:57 - INFO - __main__ - Step 1243: {'lr': 0.0003105, 'samples': 238656, 'steps': 1242, 'loss/train': 3.4750494956970215} +11/06/2021 21:26:57 - INFO - __main__ - Step 1244: {'lr': 0.00031075000000000005, 'samples': 238848, 'steps': 1243, 'loss/train': 3.7925238609313965} +11/06/2021 21:26:57 - INFO - __main__ - Step 1245: {'lr': 0.000311, 'samples': 239040, 'steps': 1244, 'loss/train': 4.293489456176758} +11/06/2021 21:26:58 - INFO - __main__ - Step 1246: {'lr': 0.00031125000000000006, 'samples': 239232, 'steps': 1245, 'loss/train': 3.7371480464935303} +11/06/2021 21:26:59 - INFO - __main__ - Step 1247: {'lr': 0.0003115, 'samples': 239424, 'steps': 1246, 'loss/train': 4.00302791595459} +11/06/2021 21:26:59 - INFO - __main__ - Step 1248: {'lr': 0.00031175, 'samples': 239616, 'steps': 1247, 'loss/train': 3.7047793865203857} +11/06/2021 21:27:00 - INFO - __main__ - Step 1249: {'lr': 0.000312, 'samples': 239808, 'steps': 1248, 'loss/train': 4.603279113769531} +11/06/2021 21:27:00 - INFO - __main__ - Step 1250: {'lr': 0.00031225000000000003, 'samples': 240000, 'steps': 1249, 'loss/train': 3.6074068546295166} +11/06/2021 21:27:00 - INFO - __main__ - Step 1251: {'lr': 0.0003125, 'samples': 240192, 'steps': 1250, 'loss/train': 4.296557903289795} +11/06/2021 21:27:01 - INFO - __main__ - Step 1252: {'lr': 0.00031275, 'samples': 240384, 'steps': 1251, 'loss/train': 3.7983367443084717} +11/06/2021 21:27:02 - INFO - __main__ - Step 1253: {'lr': 0.000313, 'samples': 240576, 'steps': 1252, 'loss/train': 3.8672046661376953} +11/06/2021 21:27:02 - INFO - __main__ - Step 1254: {'lr': 0.00031325, 'samples': 240768, 'steps': 1253, 'loss/train': 3.8182613849639893} +11/06/2021 21:27:02 - INFO - __main__ - Step 1255: {'lr': 0.00031350000000000003, 'samples': 240960, 'steps': 1254, 'loss/train': 3.425907850265503} +11/06/2021 21:27:03 - INFO - __main__ - Step 1256: {'lr': 0.00031374999999999996, 'samples': 241152, 'steps': 1255, 'loss/train': 3.5726277828216553} +11/06/2021 21:27:04 - INFO - __main__ - Step 1257: {'lr': 0.000314, 'samples': 241344, 'steps': 1256, 'loss/train': 3.928713083267212} +11/06/2021 21:27:04 - INFO - __main__ - Step 1258: {'lr': 0.00031424999999999997, 'samples': 241536, 'steps': 1257, 'loss/train': 3.986309289932251} +11/06/2021 21:27:04 - INFO - __main__ - Step 1259: {'lr': 0.0003145, 'samples': 241728, 'steps': 1258, 'loss/train': 4.367678642272949} +11/06/2021 21:27:05 - INFO - __main__ - Step 1260: {'lr': 0.00031475, 'samples': 241920, 'steps': 1259, 'loss/train': 3.995647430419922} +11/06/2021 21:27:05 - INFO - __main__ - Step 1261: {'lr': 0.000315, 'samples': 242112, 'steps': 1260, 'loss/train': 3.605346441268921} +11/06/2021 21:27:06 - INFO - __main__ - Step 1262: {'lr': 0.00031525, 'samples': 242304, 'steps': 1261, 'loss/train': 3.96653413772583} +11/06/2021 21:27:06 - INFO - __main__ - Step 1263: {'lr': 0.0003155, 'samples': 242496, 'steps': 1262, 'loss/train': 3.9042797088623047} +11/06/2021 21:27:07 - INFO - __main__ - Step 1264: {'lr': 0.00031575, 'samples': 242688, 'steps': 1263, 'loss/train': 3.5482776165008545} +11/06/2021 21:27:07 - INFO - __main__ - Step 1265: {'lr': 0.000316, 'samples': 242880, 'steps': 1264, 'loss/train': 3.473890781402588} +11/06/2021 21:27:07 - INFO - __main__ - Step 1266: {'lr': 0.00031624999999999996, 'samples': 243072, 'steps': 1265, 'loss/train': 3.6147239208221436} +11/06/2021 21:27:08 - INFO - __main__ - Step 1267: {'lr': 0.0003165, 'samples': 243264, 'steps': 1266, 'loss/train': 3.760866403579712} +11/06/2021 21:27:09 - INFO - __main__ - Step 1268: {'lr': 0.00031675, 'samples': 243456, 'steps': 1267, 'loss/train': 3.5120933055877686} +11/06/2021 21:27:10 - INFO - __main__ - Step 1269: {'lr': 0.000317, 'samples': 243648, 'steps': 1268, 'loss/train': 4.119743824005127} +11/06/2021 21:27:10 - INFO - __main__ - Step 1270: {'lr': 0.00031725, 'samples': 243840, 'steps': 1269, 'loss/train': 4.16604471206665} +11/06/2021 21:27:10 - INFO - __main__ - Step 1271: {'lr': 0.0003175, 'samples': 244032, 'steps': 1270, 'loss/train': 3.718264102935791} +11/06/2021 21:27:11 - INFO - __main__ - Step 1272: {'lr': 0.00031775, 'samples': 244224, 'steps': 1271, 'loss/train': 3.804915428161621} +11/06/2021 21:27:12 - INFO - __main__ - Step 1273: {'lr': 0.00031800000000000003, 'samples': 244416, 'steps': 1272, 'loss/train': 3.632591724395752} +11/06/2021 21:27:12 - INFO - __main__ - Step 1274: {'lr': 0.00031825, 'samples': 244608, 'steps': 1273, 'loss/train': 3.5990989208221436} +11/06/2021 21:27:12 - INFO - __main__ - Step 1275: {'lr': 0.0003185, 'samples': 244800, 'steps': 1274, 'loss/train': 3.5454981327056885} +11/06/2021 21:27:13 - INFO - __main__ - Step 1276: {'lr': 0.00031874999999999997, 'samples': 244992, 'steps': 1275, 'loss/train': 2.8243398666381836} +11/06/2021 21:27:13 - INFO - __main__ - Step 1277: {'lr': 0.000319, 'samples': 245184, 'steps': 1276, 'loss/train': 4.374372959136963} +11/06/2021 21:27:14 - INFO - __main__ - Step 1278: {'lr': 0.00031925, 'samples': 245376, 'steps': 1277, 'loss/train': 2.880706548690796} +11/06/2021 21:27:15 - INFO - __main__ - Step 1279: {'lr': 0.0003195, 'samples': 245568, 'steps': 1278, 'loss/train': 3.749918222427368} +11/06/2021 21:27:15 - INFO - __main__ - Step 1280: {'lr': 0.00031975, 'samples': 245760, 'steps': 1279, 'loss/train': 3.91780686378479} +11/06/2021 21:27:15 - INFO - __main__ - Step 1281: {'lr': 0.00032, 'samples': 245952, 'steps': 1280, 'loss/train': 3.8567497730255127} +11/06/2021 21:27:16 - INFO - __main__ - Step 1282: {'lr': 0.00032025, 'samples': 246144, 'steps': 1281, 'loss/train': 2.492274761199951} +11/06/2021 21:27:17 - INFO - __main__ - Step 1283: {'lr': 0.00032050000000000004, 'samples': 246336, 'steps': 1282, 'loss/train': 4.012140274047852} +11/06/2021 21:27:17 - INFO - __main__ - Step 1284: {'lr': 0.00032074999999999996, 'samples': 246528, 'steps': 1283, 'loss/train': 3.700061559677124} +11/06/2021 21:27:17 - INFO - __main__ - Step 1285: {'lr': 0.000321, 'samples': 246720, 'steps': 1284, 'loss/train': 4.031924724578857} +11/06/2021 21:27:18 - INFO - __main__ - Step 1286: {'lr': 0.00032125, 'samples': 246912, 'steps': 1285, 'loss/train': 4.252817153930664} +11/06/2021 21:27:18 - INFO - __main__ - Step 1287: {'lr': 0.0003215, 'samples': 247104, 'steps': 1286, 'loss/train': 3.6342227458953857} +11/06/2021 21:27:19 - INFO - __main__ - Step 1288: {'lr': 0.00032175, 'samples': 247296, 'steps': 1287, 'loss/train': 3.6176106929779053} +11/06/2021 21:27:20 - INFO - __main__ - Step 1289: {'lr': 0.000322, 'samples': 247488, 'steps': 1288, 'loss/train': 5.5985236167907715} +11/06/2021 21:27:20 - INFO - __main__ - Step 1290: {'lr': 0.00032225, 'samples': 247680, 'steps': 1289, 'loss/train': 3.5907435417175293} +11/06/2021 21:27:20 - INFO - __main__ - Step 1291: {'lr': 0.00032250000000000003, 'samples': 247872, 'steps': 1290, 'loss/train': 3.7204911708831787} +11/06/2021 21:27:21 - INFO - __main__ - Step 1292: {'lr': 0.00032275, 'samples': 248064, 'steps': 1291, 'loss/train': 3.9456405639648438} +11/06/2021 21:27:22 - INFO - __main__ - Step 1293: {'lr': 0.000323, 'samples': 248256, 'steps': 1292, 'loss/train': 3.7843210697174072} +11/06/2021 21:27:22 - INFO - __main__ - Step 1294: {'lr': 0.00032324999999999997, 'samples': 248448, 'steps': 1293, 'loss/train': 3.915496349334717} +11/06/2021 21:27:22 - INFO - __main__ - Step 1295: {'lr': 0.0003235, 'samples': 248640, 'steps': 1294, 'loss/train': 4.2259440422058105} +11/06/2021 21:27:23 - INFO - __main__ - Step 1296: {'lr': 0.00032375, 'samples': 248832, 'steps': 1295, 'loss/train': 3.61068058013916} +11/06/2021 21:27:23 - INFO - __main__ - Step 1297: {'lr': 0.000324, 'samples': 249024, 'steps': 1296, 'loss/train': 3.682305097579956} +11/06/2021 21:27:24 - INFO - __main__ - Step 1298: {'lr': 0.00032425, 'samples': 249216, 'steps': 1297, 'loss/train': 3.750075340270996} +11/06/2021 21:27:25 - INFO - __main__ - Step 1299: {'lr': 0.00032450000000000003, 'samples': 249408, 'steps': 1298, 'loss/train': 3.9268178939819336} +11/06/2021 21:27:25 - INFO - __main__ - Step 1300: {'lr': 0.00032475, 'samples': 249600, 'steps': 1299, 'loss/train': 3.8040266036987305} +11/06/2021 21:27:25 - INFO - __main__ - Step 1301: {'lr': 0.00032500000000000004, 'samples': 249792, 'steps': 1300, 'loss/train': 3.4303956031799316} +11/06/2021 21:27:26 - INFO - __main__ - Step 1302: {'lr': 0.00032524999999999996, 'samples': 249984, 'steps': 1301, 'loss/train': 4.067983150482178} +11/06/2021 21:27:27 - INFO - __main__ - Step 1303: {'lr': 0.0003255, 'samples': 250176, 'steps': 1302, 'loss/train': 3.6090753078460693} +11/06/2021 21:27:27 - INFO - __main__ - Step 1304: {'lr': 0.00032575, 'samples': 250368, 'steps': 1303, 'loss/train': 3.846041440963745} +11/06/2021 21:27:27 - INFO - __main__ - Step 1305: {'lr': 0.000326, 'samples': 250560, 'steps': 1304, 'loss/train': 4.3484272956848145} +11/06/2021 21:27:28 - INFO - __main__ - Step 1306: {'lr': 0.00032625, 'samples': 250752, 'steps': 1305, 'loss/train': 3.714219331741333} +11/06/2021 21:27:28 - INFO - __main__ - Step 1307: {'lr': 0.0003265, 'samples': 250944, 'steps': 1306, 'loss/train': 3.670234441757202} +11/06/2021 21:27:29 - INFO - __main__ - Step 1308: {'lr': 0.00032675, 'samples': 251136, 'steps': 1307, 'loss/train': 4.2095441818237305} +11/06/2021 21:27:29 - INFO - __main__ - Step 1309: {'lr': 0.00032700000000000003, 'samples': 251328, 'steps': 1308, 'loss/train': 3.6904191970825195} +11/06/2021 21:27:30 - INFO - __main__ - Step 1310: {'lr': 0.00032725, 'samples': 251520, 'steps': 1309, 'loss/train': 3.5426836013793945} +11/06/2021 21:27:30 - INFO - __main__ - Step 1311: {'lr': 0.00032750000000000005, 'samples': 251712, 'steps': 1310, 'loss/train': 3.8077216148376465} +11/06/2021 21:27:31 - INFO - __main__ - Step 1312: {'lr': 0.00032774999999999997, 'samples': 251904, 'steps': 1311, 'loss/train': 3.6772751808166504} +11/06/2021 21:27:31 - INFO - __main__ - Step 1313: {'lr': 0.000328, 'samples': 252096, 'steps': 1312, 'loss/train': 4.283506393432617} +11/06/2021 21:27:32 - INFO - __main__ - Step 1314: {'lr': 0.00032825, 'samples': 252288, 'steps': 1313, 'loss/train': 3.820636510848999} +11/06/2021 21:27:32 - INFO - __main__ - Step 1315: {'lr': 0.0003285, 'samples': 252480, 'steps': 1314, 'loss/train': 3.645063877105713} +11/06/2021 21:27:33 - INFO - __main__ - Step 1316: {'lr': 0.00032875, 'samples': 252672, 'steps': 1315, 'loss/train': 3.96279239654541} +11/06/2021 21:27:33 - INFO - __main__ - Step 1317: {'lr': 0.00032900000000000003, 'samples': 252864, 'steps': 1316, 'loss/train': 3.848276138305664} +11/06/2021 21:27:33 - INFO - __main__ - Step 1318: {'lr': 0.00032925, 'samples': 253056, 'steps': 1317, 'loss/train': 3.3637754917144775} +11/06/2021 21:27:34 - INFO - __main__ - Step 1319: {'lr': 0.00032950000000000004, 'samples': 253248, 'steps': 1318, 'loss/train': 3.951634168624878} +11/06/2021 21:27:35 - INFO - __main__ - Step 1320: {'lr': 0.00032975, 'samples': 253440, 'steps': 1319, 'loss/train': 4.035619735717773} +11/06/2021 21:27:35 - INFO - __main__ - Step 1321: {'lr': 0.00033, 'samples': 253632, 'steps': 1320, 'loss/train': 3.623622179031372} +11/06/2021 21:27:35 - INFO - __main__ - Step 1322: {'lr': 0.00033025, 'samples': 253824, 'steps': 1321, 'loss/train': 4.259491920471191} +11/06/2021 21:27:36 - INFO - __main__ - Step 1323: {'lr': 0.0003305, 'samples': 254016, 'steps': 1322, 'loss/train': 3.655144214630127} +11/06/2021 21:27:37 - INFO - __main__ - Step 1324: {'lr': 0.00033075, 'samples': 254208, 'steps': 1323, 'loss/train': 3.6705875396728516} +11/06/2021 21:27:37 - INFO - __main__ - Step 1325: {'lr': 0.000331, 'samples': 254400, 'steps': 1324, 'loss/train': 3.493577480316162} +11/06/2021 21:27:38 - INFO - __main__ - Step 1326: {'lr': 0.00033125, 'samples': 254592, 'steps': 1325, 'loss/train': 3.0190889835357666} +11/06/2021 21:27:38 - INFO - __main__ - Step 1327: {'lr': 0.00033150000000000003, 'samples': 254784, 'steps': 1326, 'loss/train': 4.079080104827881} +11/06/2021 21:27:38 - INFO - __main__ - Step 1328: {'lr': 0.00033175, 'samples': 254976, 'steps': 1327, 'loss/train': 3.815504550933838} +11/06/2021 21:27:39 - INFO - __main__ - Step 1329: {'lr': 0.00033200000000000005, 'samples': 255168, 'steps': 1328, 'loss/train': 3.4887773990631104} +11/06/2021 21:27:40 - INFO - __main__ - Step 1330: {'lr': 0.00033224999999999997, 'samples': 255360, 'steps': 1329, 'loss/train': 3.8788294792175293} +11/06/2021 21:27:40 - INFO - __main__ - Step 1331: {'lr': 0.0003325, 'samples': 255552, 'steps': 1330, 'loss/train': 3.5784215927124023} +11/06/2021 21:27:40 - INFO - __main__ - Step 1332: {'lr': 0.00033275, 'samples': 255744, 'steps': 1331, 'loss/train': 3.404329299926758} +11/06/2021 21:27:41 - INFO - __main__ - Step 1333: {'lr': 0.000333, 'samples': 255936, 'steps': 1332, 'loss/train': 3.8690433502197266} +11/06/2021 21:27:42 - INFO - __main__ - Step 1334: {'lr': 0.00033325, 'samples': 256128, 'steps': 1333, 'loss/train': 3.4080007076263428} +11/06/2021 21:27:42 - INFO - __main__ - Step 1335: {'lr': 0.00033350000000000003, 'samples': 256320, 'steps': 1334, 'loss/train': 3.692984104156494} +11/06/2021 21:27:42 - INFO - __main__ - Step 1336: {'lr': 0.00033375, 'samples': 256512, 'steps': 1335, 'loss/train': 3.570852756500244} +11/06/2021 21:27:43 - INFO - __main__ - Step 1337: {'lr': 0.00033400000000000004, 'samples': 256704, 'steps': 1336, 'loss/train': 3.4716129302978516} +11/06/2021 21:27:43 - INFO - __main__ - Step 1338: {'lr': 0.00033425, 'samples': 256896, 'steps': 1337, 'loss/train': 3.4797582626342773} +11/06/2021 21:27:44 - INFO - __main__ - Step 1339: {'lr': 0.00033450000000000005, 'samples': 257088, 'steps': 1338, 'loss/train': 3.386270046234131} +11/06/2021 21:27:45 - INFO - __main__ - Step 1340: {'lr': 0.00033475, 'samples': 257280, 'steps': 1339, 'loss/train': 4.1568217277526855} +11/06/2021 21:27:45 - INFO - __main__ - Step 1341: {'lr': 0.000335, 'samples': 257472, 'steps': 1340, 'loss/train': 3.2953333854675293} +11/06/2021 21:27:45 - INFO - __main__ - Step 1342: {'lr': 0.00033525, 'samples': 257664, 'steps': 1341, 'loss/train': 3.355146646499634} +11/06/2021 21:27:46 - INFO - __main__ - Step 1343: {'lr': 0.0003355, 'samples': 257856, 'steps': 1342, 'loss/train': 3.234477996826172} +11/06/2021 21:27:47 - INFO - __main__ - Step 1344: {'lr': 0.00033575, 'samples': 258048, 'steps': 1343, 'loss/train': 3.457892656326294} +11/06/2021 21:27:47 - INFO - __main__ - Step 1345: {'lr': 0.00033600000000000004, 'samples': 258240, 'steps': 1344, 'loss/train': 3.948150634765625} +11/06/2021 21:27:47 - INFO - __main__ - Step 1346: {'lr': 0.00033625, 'samples': 258432, 'steps': 1345, 'loss/train': 3.7880961894989014} +11/06/2021 21:27:48 - INFO - __main__ - Step 1347: {'lr': 0.00033650000000000005, 'samples': 258624, 'steps': 1346, 'loss/train': 3.310671329498291} +11/06/2021 21:27:48 - INFO - __main__ - Step 1348: {'lr': 0.00033675, 'samples': 258816, 'steps': 1347, 'loss/train': 3.0229480266571045} +11/06/2021 21:27:49 - INFO - __main__ - Step 1349: {'lr': 0.000337, 'samples': 259008, 'steps': 1348, 'loss/train': 3.778203010559082} +11/06/2021 21:27:50 - INFO - __main__ - Step 1350: {'lr': 0.00033725, 'samples': 259200, 'steps': 1349, 'loss/train': 3.488584280014038} +11/06/2021 21:27:50 - INFO - __main__ - Step 1351: {'lr': 0.0003375, 'samples': 259392, 'steps': 1350, 'loss/train': 2.763584613800049} +11/06/2021 21:27:50 - INFO - __main__ - Step 1352: {'lr': 0.00033775, 'samples': 259584, 'steps': 1351, 'loss/train': 3.3598763942718506} +11/06/2021 21:27:51 - INFO - __main__ - Step 1353: {'lr': 0.00033800000000000003, 'samples': 259776, 'steps': 1352, 'loss/train': 3.7228636741638184} +11/06/2021 21:27:51 - INFO - __main__ - Step 1354: {'lr': 0.00033825, 'samples': 259968, 'steps': 1353, 'loss/train': 4.054864883422852} +11/06/2021 21:27:52 - INFO - __main__ - Step 1355: {'lr': 0.00033850000000000004, 'samples': 260160, 'steps': 1354, 'loss/train': 3.6283679008483887} +11/06/2021 21:27:53 - INFO - __main__ - Step 1356: {'lr': 0.00033875, 'samples': 260352, 'steps': 1355, 'loss/train': 3.3796229362487793} +11/06/2021 21:27:53 - INFO - __main__ - Step 1357: {'lr': 0.00033900000000000005, 'samples': 260544, 'steps': 1356, 'loss/train': 3.939152717590332} +11/06/2021 21:27:53 - INFO - __main__ - Step 1358: {'lr': 0.00033925, 'samples': 260736, 'steps': 1357, 'loss/train': 4.031463623046875} +11/06/2021 21:27:54 - INFO - __main__ - Step 1359: {'lr': 0.0003395, 'samples': 260928, 'steps': 1358, 'loss/train': 4.39647912979126} +11/06/2021 21:27:55 - INFO - __main__ - Step 1360: {'lr': 0.00033975, 'samples': 261120, 'steps': 1359, 'loss/train': 3.659208059310913} +11/06/2021 21:27:55 - INFO - __main__ - Step 1361: {'lr': 0.00034, 'samples': 261312, 'steps': 1360, 'loss/train': 4.465490341186523} +11/06/2021 21:27:55 - INFO - __main__ - Step 1362: {'lr': 0.00034025, 'samples': 261504, 'steps': 1361, 'loss/train': 4.4638543128967285} +11/06/2021 21:27:56 - INFO - __main__ - Step 1363: {'lr': 0.00034050000000000004, 'samples': 261696, 'steps': 1362, 'loss/train': 4.332038402557373} +11/06/2021 21:27:56 - INFO - __main__ - Step 1364: {'lr': 0.00034075, 'samples': 261888, 'steps': 1363, 'loss/train': 4.257739543914795} +11/06/2021 21:27:57 - INFO - __main__ - Step 1365: {'lr': 0.00034100000000000005, 'samples': 262080, 'steps': 1364, 'loss/train': 3.7311654090881348} +11/06/2021 21:27:57 - INFO - __main__ - Step 1366: {'lr': 0.00034125000000000003, 'samples': 262272, 'steps': 1365, 'loss/train': 3.6005234718322754} +11/06/2021 21:27:58 - INFO - __main__ - Step 1367: {'lr': 0.0003415, 'samples': 262464, 'steps': 1366, 'loss/train': 3.586486339569092} +11/06/2021 21:27:58 - INFO - __main__ - Step 1368: {'lr': 0.00034175, 'samples': 262656, 'steps': 1367, 'loss/train': 2.7847213745117188} +11/06/2021 21:27:59 - INFO - __main__ - Step 1369: {'lr': 0.000342, 'samples': 262848, 'steps': 1368, 'loss/train': 3.146930456161499} +11/06/2021 21:28:00 - INFO - __main__ - Step 1370: {'lr': 0.00034225, 'samples': 263040, 'steps': 1369, 'loss/train': 3.4413974285125732} +11/06/2021 21:28:00 - INFO - __main__ - Step 1371: {'lr': 0.00034250000000000003, 'samples': 263232, 'steps': 1370, 'loss/train': 3.6233880519866943} +11/06/2021 21:28:00 - INFO - __main__ - Step 1372: {'lr': 0.00034275, 'samples': 263424, 'steps': 1371, 'loss/train': 3.721611261367798} +11/06/2021 21:28:01 - INFO - __main__ - Step 1373: {'lr': 0.00034300000000000004, 'samples': 263616, 'steps': 1372, 'loss/train': 4.222573757171631} +11/06/2021 21:28:01 - INFO - __main__ - Step 1374: {'lr': 0.00034325, 'samples': 263808, 'steps': 1373, 'loss/train': 3.599992513656616} +11/06/2021 21:28:02 - INFO - __main__ - Step 1375: {'lr': 0.00034350000000000006, 'samples': 264000, 'steps': 1374, 'loss/train': 3.8981473445892334} +11/06/2021 21:28:03 - INFO - __main__ - Step 1376: {'lr': 0.00034375, 'samples': 264192, 'steps': 1375, 'loss/train': 3.6449296474456787} +11/06/2021 21:28:03 - INFO - __main__ - Step 1377: {'lr': 0.00034399999999999996, 'samples': 264384, 'steps': 1376, 'loss/train': 3.2894580364227295} +11/06/2021 21:28:03 - INFO - __main__ - Step 1378: {'lr': 0.00034425, 'samples': 264576, 'steps': 1377, 'loss/train': 3.513908624649048} +11/06/2021 21:28:04 - INFO - __main__ - Step 1379: {'lr': 0.00034449999999999997, 'samples': 264768, 'steps': 1378, 'loss/train': 4.0787034034729} +11/06/2021 21:28:05 - INFO - __main__ - Step 1380: {'lr': 0.00034475, 'samples': 264960, 'steps': 1379, 'loss/train': 3.7418301105499268} +11/06/2021 21:28:05 - INFO - __main__ - Step 1381: {'lr': 0.000345, 'samples': 265152, 'steps': 1380, 'loss/train': 3.700737237930298} +11/06/2021 21:28:05 - INFO - __main__ - Step 1382: {'lr': 0.00034525, 'samples': 265344, 'steps': 1381, 'loss/train': 3.3428897857666016} +11/06/2021 21:28:06 - INFO - __main__ - Step 1383: {'lr': 0.0003455, 'samples': 265536, 'steps': 1382, 'loss/train': 3.495915651321411} +11/06/2021 21:28:06 - INFO - __main__ - Step 1384: {'lr': 0.00034575000000000003, 'samples': 265728, 'steps': 1383, 'loss/train': 3.5448079109191895} +11/06/2021 21:28:07 - INFO - __main__ - Step 1385: {'lr': 0.000346, 'samples': 265920, 'steps': 1384, 'loss/train': 3.691251277923584} +11/06/2021 21:28:07 - INFO - __main__ - Step 1386: {'lr': 0.00034625, 'samples': 266112, 'steps': 1385, 'loss/train': 2.9062933921813965} +11/06/2021 21:28:08 - INFO - __main__ - Step 1387: {'lr': 0.00034649999999999997, 'samples': 266304, 'steps': 1386, 'loss/train': 3.5462396144866943} +11/06/2021 21:28:08 - INFO - __main__ - Step 1388: {'lr': 0.00034675, 'samples': 266496, 'steps': 1387, 'loss/train': 5.252135276794434} +11/06/2021 21:28:08 - INFO - __main__ - Step 1389: {'lr': 0.000347, 'samples': 266688, 'steps': 1388, 'loss/train': 3.7084007263183594} +11/06/2021 21:28:09 - INFO - __main__ - Step 1390: {'lr': 0.00034725, 'samples': 266880, 'steps': 1389, 'loss/train': 4.000763893127441} +11/06/2021 21:28:10 - INFO - __main__ - Step 1391: {'lr': 0.0003475, 'samples': 267072, 'steps': 1390, 'loss/train': 3.437042474746704} +11/06/2021 21:28:10 - INFO - __main__ - Step 1392: {'lr': 0.00034775, 'samples': 267264, 'steps': 1391, 'loss/train': 3.971050977706909} +11/06/2021 21:28:11 - INFO - __main__ - Step 1393: {'lr': 0.000348, 'samples': 267456, 'steps': 1392, 'loss/train': 3.698169231414795} +11/06/2021 21:28:11 - INFO - __main__ - Step 1394: {'lr': 0.00034825000000000004, 'samples': 267648, 'steps': 1393, 'loss/train': 3.2756340503692627} +11/06/2021 21:28:11 - INFO - __main__ - Step 1395: {'lr': 0.00034849999999999996, 'samples': 267840, 'steps': 1394, 'loss/train': 3.3742105960845947} +11/06/2021 21:28:12 - INFO - __main__ - Step 1396: {'lr': 0.00034875, 'samples': 268032, 'steps': 1395, 'loss/train': 3.8026742935180664} +11/06/2021 21:28:13 - INFO - __main__ - Step 1397: {'lr': 0.00034899999999999997, 'samples': 268224, 'steps': 1396, 'loss/train': 3.521596908569336} +11/06/2021 21:28:13 - INFO - __main__ - Step 1398: {'lr': 0.00034925, 'samples': 268416, 'steps': 1397, 'loss/train': 3.4449994564056396} +11/06/2021 21:28:13 - INFO - __main__ - Step 1399: {'lr': 0.0003495, 'samples': 268608, 'steps': 1398, 'loss/train': 3.146643877029419} +11/06/2021 21:28:14 - INFO - __main__ - Step 1400: {'lr': 0.00034975, 'samples': 268800, 'steps': 1399, 'loss/train': 3.3726940155029297} +11/06/2021 21:28:15 - INFO - __main__ - Step 1401: {'lr': 0.00035, 'samples': 268992, 'steps': 1400, 'loss/train': 3.4211158752441406} +11/06/2021 21:28:15 - INFO - __main__ - Step 1402: {'lr': 0.00035025000000000003, 'samples': 269184, 'steps': 1401, 'loss/train': 3.7196311950683594} +11/06/2021 21:28:15 - INFO - __main__ - Step 1403: {'lr': 0.0003505, 'samples': 269376, 'steps': 1402, 'loss/train': 3.6825990676879883} +11/06/2021 21:28:16 - INFO - __main__ - Step 1404: {'lr': 0.00035075, 'samples': 269568, 'steps': 1403, 'loss/train': 3.5246872901916504} +11/06/2021 21:28:16 - INFO - __main__ - Step 1405: {'lr': 0.00035099999999999997, 'samples': 269760, 'steps': 1404, 'loss/train': 3.948554277420044} +11/06/2021 21:28:17 - INFO - __main__ - Step 1406: {'lr': 0.00035125, 'samples': 269952, 'steps': 1405, 'loss/train': 3.4808645248413086} +11/06/2021 21:28:18 - INFO - __main__ - Step 1407: {'lr': 0.0003515, 'samples': 270144, 'steps': 1406, 'loss/train': 3.6043059825897217} +11/06/2021 21:28:18 - INFO - __main__ - Step 1408: {'lr': 0.00035175, 'samples': 270336, 'steps': 1407, 'loss/train': 3.91089129447937} +11/06/2021 21:28:18 - INFO - __main__ - Step 1409: {'lr': 0.000352, 'samples': 270528, 'steps': 1408, 'loss/train': 3.544276237487793} +11/06/2021 21:28:19 - INFO - __main__ - Step 1410: {'lr': 0.00035225, 'samples': 270720, 'steps': 1409, 'loss/train': 3.8686203956604004} +11/06/2021 21:28:20 - INFO - __main__ - Step 1411: {'lr': 0.0003525, 'samples': 270912, 'steps': 1410, 'loss/train': 3.5301620960235596} +11/06/2021 21:28:20 - INFO - __main__ - Step 1412: {'lr': 0.00035275000000000004, 'samples': 271104, 'steps': 1411, 'loss/train': 3.6756720542907715} +11/06/2021 21:28:21 - INFO - __main__ - Step 1413: {'lr': 0.00035299999999999996, 'samples': 271296, 'steps': 1412, 'loss/train': 3.3864593505859375} +11/06/2021 21:28:21 - INFO - __main__ - Step 1414: {'lr': 0.00035325, 'samples': 271488, 'steps': 1413, 'loss/train': 3.0657331943511963} +11/06/2021 21:28:21 - INFO - __main__ - Step 1415: {'lr': 0.0003535, 'samples': 271680, 'steps': 1414, 'loss/train': 3.454667091369629} +11/06/2021 21:28:22 - INFO - __main__ - Step 1416: {'lr': 0.00035375, 'samples': 271872, 'steps': 1415, 'loss/train': 3.242163896560669} +11/06/2021 21:28:23 - INFO - __main__ - Step 1417: {'lr': 0.000354, 'samples': 272064, 'steps': 1416, 'loss/train': 3.9992828369140625} +11/06/2021 21:28:23 - INFO - __main__ - Step 1418: {'lr': 0.00035425, 'samples': 272256, 'steps': 1417, 'loss/train': 3.688415050506592} +11/06/2021 21:28:23 - INFO - __main__ - Step 1419: {'lr': 0.0003545, 'samples': 272448, 'steps': 1418, 'loss/train': 3.7804338932037354} +11/06/2021 21:28:24 - INFO - __main__ - Step 1420: {'lr': 0.00035475000000000003, 'samples': 272640, 'steps': 1419, 'loss/train': 3.729741096496582} +11/06/2021 21:28:25 - INFO - __main__ - Step 1421: {'lr': 0.000355, 'samples': 272832, 'steps': 1420, 'loss/train': 4.303407192230225} +11/06/2021 21:28:25 - INFO - __main__ - Step 1422: {'lr': 0.00035525000000000004, 'samples': 273024, 'steps': 1421, 'loss/train': 3.4556620121002197} +11/06/2021 21:28:26 - INFO - __main__ - Step 1423: {'lr': 0.00035549999999999997, 'samples': 273216, 'steps': 1422, 'loss/train': 2.991054058074951} +11/06/2021 21:28:26 - INFO - __main__ - Step 1424: {'lr': 0.00035575, 'samples': 273408, 'steps': 1423, 'loss/train': 4.185265064239502} +11/06/2021 21:28:26 - INFO - __main__ - Step 1425: {'lr': 0.000356, 'samples': 273600, 'steps': 1424, 'loss/train': 3.529508590698242} +11/06/2021 21:28:27 - INFO - __main__ - Step 1426: {'lr': 0.00035625, 'samples': 273792, 'steps': 1425, 'loss/train': 3.394829034805298} +11/06/2021 21:28:28 - INFO - __main__ - Step 1427: {'lr': 0.0003565, 'samples': 273984, 'steps': 1426, 'loss/train': 4.052621364593506} +11/06/2021 21:28:28 - INFO - __main__ - Step 1428: {'lr': 0.00035675, 'samples': 274176, 'steps': 1427, 'loss/train': 3.0512208938598633} +11/06/2021 21:28:28 - INFO - __main__ - Step 1429: {'lr': 0.000357, 'samples': 274368, 'steps': 1428, 'loss/train': 3.3234691619873047} +11/06/2021 21:28:29 - INFO - __main__ - Step 1430: {'lr': 0.00035725000000000004, 'samples': 274560, 'steps': 1429, 'loss/train': 3.588322162628174} +11/06/2021 21:28:29 - INFO - __main__ - Step 1431: {'lr': 0.0003575, 'samples': 274752, 'steps': 1430, 'loss/train': 3.39493727684021} +11/06/2021 21:28:30 - INFO - __main__ - Step 1432: {'lr': 0.00035775, 'samples': 274944, 'steps': 1431, 'loss/train': 2.880502939224243} +11/06/2021 21:28:30 - INFO - __main__ - Step 1433: {'lr': 0.000358, 'samples': 275136, 'steps': 1432, 'loss/train': 3.7747838497161865} +11/06/2021 21:28:31 - INFO - __main__ - Step 1434: {'lr': 0.00035825, 'samples': 275328, 'steps': 1433, 'loss/train': 3.3060061931610107} +11/06/2021 21:28:31 - INFO - __main__ - Step 1435: {'lr': 0.0003585, 'samples': 275520, 'steps': 1434, 'loss/train': 3.7018392086029053} +11/06/2021 21:28:32 - INFO - __main__ - Step 1436: {'lr': 0.00035875, 'samples': 275712, 'steps': 1435, 'loss/train': 3.0778818130493164} +11/06/2021 21:28:33 - INFO - __main__ - Step 1437: {'lr': 0.000359, 'samples': 275904, 'steps': 1436, 'loss/train': 3.736198902130127} +11/06/2021 21:28:33 - INFO - __main__ - Step 1438: {'lr': 0.00035925000000000003, 'samples': 276096, 'steps': 1437, 'loss/train': 3.045379877090454} +11/06/2021 21:28:33 - INFO - __main__ - Step 1439: {'lr': 0.0003595, 'samples': 276288, 'steps': 1438, 'loss/train': 3.695364475250244} +11/06/2021 21:28:34 - INFO - __main__ - Step 1440: {'lr': 0.00035975000000000004, 'samples': 276480, 'steps': 1439, 'loss/train': 3.711172342300415} +11/06/2021 21:28:34 - INFO - __main__ - Step 1441: {'lr': 0.00035999999999999997, 'samples': 276672, 'steps': 1440, 'loss/train': 2.9761195182800293} +11/06/2021 21:28:35 - INFO - __main__ - Step 1442: {'lr': 0.00036025, 'samples': 276864, 'steps': 1441, 'loss/train': 3.2470874786376953} +11/06/2021 21:28:35 - INFO - __main__ - Step 1443: {'lr': 0.0003605, 'samples': 277056, 'steps': 1442, 'loss/train': 3.0125174522399902} +11/06/2021 21:28:36 - INFO - __main__ - Step 1444: {'lr': 0.00036075, 'samples': 277248, 'steps': 1443, 'loss/train': 3.5066580772399902} +11/06/2021 21:28:36 - INFO - __main__ - Step 1445: {'lr': 0.000361, 'samples': 277440, 'steps': 1444, 'loss/train': 3.245635747909546} +11/06/2021 21:28:36 - INFO - __main__ - Step 1446: {'lr': 0.00036125, 'samples': 277632, 'steps': 1445, 'loss/train': 4.3313374519348145} +11/06/2021 21:28:38 - INFO - __main__ - Step 1447: {'lr': 0.0003615, 'samples': 277824, 'steps': 1446, 'loss/train': 3.90049409866333} +11/06/2021 21:28:38 - INFO - __main__ - Step 1448: {'lr': 0.00036175000000000004, 'samples': 278016, 'steps': 1447, 'loss/train': 2.849242687225342} +11/06/2021 21:28:38 - INFO - __main__ - Step 1449: {'lr': 0.000362, 'samples': 278208, 'steps': 1448, 'loss/train': 3.8985612392425537} +11/06/2021 21:28:39 - INFO - __main__ - Step 1450: {'lr': 0.00036225000000000005, 'samples': 278400, 'steps': 1449, 'loss/train': 3.1428816318511963} +11/06/2021 21:28:39 - INFO - __main__ - Step 1451: {'lr': 0.0003625, 'samples': 278592, 'steps': 1450, 'loss/train': 3.8840200901031494} +11/06/2021 21:28:39 - INFO - __main__ - Step 1452: {'lr': 0.00036275, 'samples': 278784, 'steps': 1451, 'loss/train': 3.16904354095459} +11/06/2021 21:28:40 - INFO - __main__ - Step 1453: {'lr': 0.000363, 'samples': 278976, 'steps': 1452, 'loss/train': 2.8679397106170654} +11/06/2021 21:28:41 - INFO - __main__ - Step 1454: {'lr': 0.00036325, 'samples': 279168, 'steps': 1453, 'loss/train': 3.2666327953338623} +11/06/2021 21:28:41 - INFO - __main__ - Step 1455: {'lr': 0.0003635, 'samples': 279360, 'steps': 1454, 'loss/train': 3.257840871810913} +11/06/2021 21:28:41 - INFO - __main__ - Step 1456: {'lr': 0.00036375000000000003, 'samples': 279552, 'steps': 1455, 'loss/train': 3.4981942176818848} +11/06/2021 21:28:42 - INFO - __main__ - Step 1457: {'lr': 0.000364, 'samples': 279744, 'steps': 1456, 'loss/train': 3.474823236465454} +11/06/2021 21:28:43 - INFO - __main__ - Step 1458: {'lr': 0.00036425000000000004, 'samples': 279936, 'steps': 1457, 'loss/train': 3.6593263149261475} +11/06/2021 21:28:43 - INFO - __main__ - Step 1459: {'lr': 0.0003645, 'samples': 280128, 'steps': 1458, 'loss/train': 3.4789998531341553} +11/06/2021 21:28:43 - INFO - __main__ - Step 1460: {'lr': 0.00036475, 'samples': 280320, 'steps': 1459, 'loss/train': 3.415144920349121} +11/06/2021 21:28:44 - INFO - __main__ - Step 1461: {'lr': 0.000365, 'samples': 280512, 'steps': 1460, 'loss/train': 3.892705202102661} +11/06/2021 21:28:44 - INFO - __main__ - Step 1462: {'lr': 0.00036525, 'samples': 280704, 'steps': 1461, 'loss/train': 3.5692012310028076} +11/06/2021 21:28:45 - INFO - __main__ - Step 1463: {'lr': 0.0003655, 'samples': 280896, 'steps': 1462, 'loss/train': 3.964817762374878} +11/06/2021 21:28:46 - INFO - __main__ - Step 1464: {'lr': 0.00036575, 'samples': 281088, 'steps': 1463, 'loss/train': 3.4829154014587402} +11/06/2021 21:28:46 - INFO - __main__ - Step 1465: {'lr': 0.000366, 'samples': 281280, 'steps': 1464, 'loss/train': 3.2892184257507324} +11/06/2021 21:28:46 - INFO - __main__ - Step 1466: {'lr': 0.00036625000000000004, 'samples': 281472, 'steps': 1465, 'loss/train': 3.158153772354126} +11/06/2021 21:28:47 - INFO - __main__ - Step 1467: {'lr': 0.0003665, 'samples': 281664, 'steps': 1466, 'loss/train': 3.4137485027313232} +11/06/2021 21:28:48 - INFO - __main__ - Step 1468: {'lr': 0.00036675000000000005, 'samples': 281856, 'steps': 1467, 'loss/train': 3.1349167823791504} +11/06/2021 21:28:48 - INFO - __main__ - Step 1469: {'lr': 0.000367, 'samples': 282048, 'steps': 1468, 'loss/train': 2.7978010177612305} +11/06/2021 21:28:48 - INFO - __main__ - Step 1470: {'lr': 0.00036725, 'samples': 282240, 'steps': 1469, 'loss/train': 3.418675184249878} +11/06/2021 21:28:49 - INFO - __main__ - Step 1471: {'lr': 0.0003675, 'samples': 282432, 'steps': 1470, 'loss/train': 3.3369407653808594} +11/06/2021 21:28:49 - INFO - __main__ - Step 1472: {'lr': 0.00036775, 'samples': 282624, 'steps': 1471, 'loss/train': 3.0756335258483887} +11/06/2021 21:28:50 - INFO - __main__ - Step 1473: {'lr': 0.000368, 'samples': 282816, 'steps': 1472, 'loss/train': 3.3924009799957275} +11/06/2021 21:28:51 - INFO - __main__ - Step 1474: {'lr': 0.00036825000000000003, 'samples': 283008, 'steps': 1473, 'loss/train': 3.3130877017974854} +11/06/2021 21:28:51 - INFO - __main__ - Step 1475: {'lr': 0.0003685, 'samples': 283200, 'steps': 1474, 'loss/train': 2.7034976482391357} +11/06/2021 21:28:51 - INFO - __main__ - Step 1476: {'lr': 0.00036875000000000005, 'samples': 283392, 'steps': 1475, 'loss/train': 2.9324753284454346} +11/06/2021 21:28:52 - INFO - __main__ - Step 1477: {'lr': 0.000369, 'samples': 283584, 'steps': 1476, 'loss/train': 3.632042407989502} +11/06/2021 21:28:53 - INFO - __main__ - Step 1478: {'lr': 0.00036925, 'samples': 283776, 'steps': 1477, 'loss/train': 3.7734642028808594} +11/06/2021 21:28:54 - INFO - __main__ - Step 1479: {'lr': 0.0003695, 'samples': 283968, 'steps': 1478, 'loss/train': 3.285372018814087} +11/06/2021 21:28:54 - INFO - __main__ - Step 1480: {'lr': 0.00036975, 'samples': 284160, 'steps': 1479, 'loss/train': 3.5449750423431396} +11/06/2021 21:28:54 - INFO - __main__ - Step 1481: {'lr': 0.00037, 'samples': 284352, 'steps': 1480, 'loss/train': 3.1665492057800293} +11/06/2021 21:28:55 - INFO - __main__ - Step 1482: {'lr': 0.00037025000000000003, 'samples': 284544, 'steps': 1481, 'loss/train': 2.68510103225708} +11/06/2021 21:28:55 - INFO - __main__ - Step 1483: {'lr': 0.0003705, 'samples': 284736, 'steps': 1482, 'loss/train': 3.09177303314209} +11/06/2021 21:28:56 - INFO - __main__ - Step 1484: {'lr': 0.00037075000000000004, 'samples': 284928, 'steps': 1483, 'loss/train': 0.934282124042511} +11/06/2021 21:28:57 - INFO - __main__ - Step 1485: {'lr': 0.000371, 'samples': 285120, 'steps': 1484, 'loss/train': 0.7881891131401062} +11/06/2021 21:28:57 - INFO - __main__ - Step 1486: {'lr': 0.00037125000000000005, 'samples': 285312, 'steps': 1485, 'loss/train': 3.3031082153320312} +11/06/2021 21:28:58 - INFO - __main__ - Step 1487: {'lr': 0.00037150000000000003, 'samples': 285504, 'steps': 1486, 'loss/train': 3.4887430667877197} +11/06/2021 21:28:58 - INFO - __main__ - Step 1488: {'lr': 0.00037175, 'samples': 285696, 'steps': 1487, 'loss/train': 3.392094850540161} +11/06/2021 21:28:58 - INFO - __main__ - Step 1489: {'lr': 0.000372, 'samples': 285888, 'steps': 1488, 'loss/train': 3.5077946186065674} +11/06/2021 21:28:59 - INFO - __main__ - Step 1490: {'lr': 0.00037225, 'samples': 286080, 'steps': 1489, 'loss/train': 3.9329774379730225} +11/06/2021 21:29:00 - INFO - __main__ - Step 1491: {'lr': 0.0003725, 'samples': 286272, 'steps': 1490, 'loss/train': 3.5324740409851074} +11/06/2021 21:29:00 - INFO - __main__ - Step 1492: {'lr': 0.00037275000000000003, 'samples': 286464, 'steps': 1491, 'loss/train': 2.4463398456573486} +11/06/2021 21:29:00 - INFO - __main__ - Step 1493: {'lr': 0.000373, 'samples': 286656, 'steps': 1492, 'loss/train': 3.127577066421509} +11/06/2021 21:29:01 - INFO - __main__ - Step 1494: {'lr': 0.00037325000000000005, 'samples': 286848, 'steps': 1493, 'loss/train': 1.6627174615859985} +11/06/2021 21:29:03 - INFO - __main__ - Step 1495: {'lr': 0.0003735, 'samples': 287040, 'steps': 1494, 'loss/train': 3.5371575355529785} +11/06/2021 21:29:03 - INFO - __main__ - Step 1496: {'lr': 0.00037375000000000006, 'samples': 287232, 'steps': 1495, 'loss/train': 3.178628921508789} +11/06/2021 21:29:03 - INFO - __main__ - Step 1497: {'lr': 0.000374, 'samples': 287424, 'steps': 1496, 'loss/train': 2.7111098766326904} +11/06/2021 21:29:04 - INFO - __main__ - Step 1498: {'lr': 0.00037425, 'samples': 287616, 'steps': 1497, 'loss/train': 4.202212810516357} +11/06/2021 21:29:04 - INFO - __main__ - Step 1499: {'lr': 0.0003745, 'samples': 287808, 'steps': 1498, 'loss/train': 3.379865884780884} +11/06/2021 21:29:04 - INFO - __main__ - Step 1500: {'lr': 0.00037475000000000003, 'samples': 288000, 'steps': 1499, 'loss/train': 3.4952762126922607} +11/06/2021 21:29:05 - INFO - __main__ - Step 1501: {'lr': 0.000375, 'samples': 288192, 'steps': 1500, 'loss/train': 4.174196720123291} +11/06/2021 21:29:06 - INFO - __main__ - Step 1502: {'lr': 0.00037525, 'samples': 288384, 'steps': 1501, 'loss/train': 3.272667169570923} +11/06/2021 21:29:06 - INFO - __main__ - Step 1503: {'lr': 0.0003755, 'samples': 288576, 'steps': 1502, 'loss/train': 2.8478939533233643} +11/06/2021 21:29:07 - INFO - __main__ - Step 1504: {'lr': 0.00037575, 'samples': 288768, 'steps': 1503, 'loss/train': 4.3909077644348145} +11/06/2021 21:29:07 - INFO - __main__ - Step 1505: {'lr': 0.00037600000000000003, 'samples': 288960, 'steps': 1504, 'loss/train': 3.602169990539551} +11/06/2021 21:29:08 - INFO - __main__ - Step 1506: {'lr': 0.00037624999999999996, 'samples': 289152, 'steps': 1505, 'loss/train': 3.1311495304107666} +11/06/2021 21:29:08 - INFO - __main__ - Step 1507: {'lr': 0.0003765, 'samples': 289344, 'steps': 1506, 'loss/train': 2.88991379737854} +11/06/2021 21:29:09 - INFO - __main__ - Step 1508: {'lr': 0.00037674999999999997, 'samples': 289536, 'steps': 1507, 'loss/train': 2.8797428607940674} +11/06/2021 21:29:09 - INFO - __main__ - Step 1509: {'lr': 0.000377, 'samples': 289728, 'steps': 1508, 'loss/train': 3.3940863609313965} +11/06/2021 21:29:09 - INFO - __main__ - Step 1510: {'lr': 0.00037725, 'samples': 289920, 'steps': 1509, 'loss/train': 3.036484479904175} +11/06/2021 21:29:10 - INFO - __main__ - Step 1511: {'lr': 0.0003775, 'samples': 290112, 'steps': 1510, 'loss/train': 4.253868579864502} +11/06/2021 21:29:11 - INFO - __main__ - Step 1512: {'lr': 0.00037775, 'samples': 290304, 'steps': 1511, 'loss/train': 3.5372188091278076} +11/06/2021 21:29:11 - INFO - __main__ - Step 1513: {'lr': 0.000378, 'samples': 290496, 'steps': 1512, 'loss/train': 3.0633351802825928} +11/06/2021 21:29:12 - INFO - __main__ - Step 1514: {'lr': 0.00037825, 'samples': 290688, 'steps': 1513, 'loss/train': 3.378868818283081} +11/06/2021 21:29:12 - INFO - __main__ - Step 1515: {'lr': 0.0003785, 'samples': 290880, 'steps': 1514, 'loss/train': 4.058987140655518} +11/06/2021 21:29:12 - INFO - __main__ - Step 1516: {'lr': 0.00037874999999999996, 'samples': 291072, 'steps': 1515, 'loss/train': 3.8939054012298584} +11/06/2021 21:29:14 - INFO - __main__ - Step 1517: {'lr': 0.000379, 'samples': 291264, 'steps': 1516, 'loss/train': 3.405064344406128} +11/06/2021 21:29:15 - INFO - __main__ - Step 1518: {'lr': 0.00037925, 'samples': 291456, 'steps': 1517, 'loss/train': 3.7268097400665283} +11/06/2021 21:29:15 - INFO - __main__ - Step 1519: {'lr': 0.0003795, 'samples': 291648, 'steps': 1518, 'loss/train': 3.949538469314575} +11/06/2021 21:29:16 - INFO - __main__ - Step 1520: {'lr': 0.00037975, 'samples': 291840, 'steps': 1519, 'loss/train': 2.9000167846679688} +11/06/2021 21:29:16 - INFO - __main__ - Step 1521: {'lr': 0.00038, 'samples': 292032, 'steps': 1520, 'loss/train': 1.4307708740234375} +11/06/2021 21:29:16 - INFO - __main__ - Step 1522: {'lr': 0.00038025, 'samples': 292224, 'steps': 1521, 'loss/train': 1.3860046863555908} +11/06/2021 21:29:17 - INFO - __main__ - Step 1523: {'lr': 0.00038050000000000003, 'samples': 292416, 'steps': 1522, 'loss/train': 1.1130292415618896} +11/06/2021 21:29:18 - INFO - __main__ - Step 1524: {'lr': 0.00038075, 'samples': 292608, 'steps': 1523, 'loss/train': 3.4155771732330322} +11/06/2021 21:29:18 - INFO - __main__ - Step 1525: {'lr': 0.000381, 'samples': 292800, 'steps': 1524, 'loss/train': 3.0278680324554443} +11/06/2021 21:29:19 - INFO - __main__ - Step 1526: {'lr': 0.00038124999999999997, 'samples': 292992, 'steps': 1525, 'loss/train': 3.4204211235046387} +11/06/2021 21:29:19 - INFO - __main__ - Step 1527: {'lr': 0.0003815, 'samples': 293184, 'steps': 1526, 'loss/train': 2.968132972717285} +11/06/2021 21:29:19 - INFO - __main__ - Step 1528: {'lr': 0.00038175, 'samples': 293376, 'steps': 1527, 'loss/train': 3.8879196643829346} +11/06/2021 21:29:20 - INFO - __main__ - Step 1529: {'lr': 0.000382, 'samples': 293568, 'steps': 1528, 'loss/train': 3.570026159286499} +11/06/2021 21:29:21 - INFO - __main__ - Step 1530: {'lr': 0.00038225, 'samples': 293760, 'steps': 1529, 'loss/train': 3.1837944984436035} +11/06/2021 21:29:21 - INFO - __main__ - Step 1531: {'lr': 0.00038250000000000003, 'samples': 293952, 'steps': 1530, 'loss/train': 2.6540393829345703} +11/06/2021 21:29:22 - INFO - __main__ - Step 1532: {'lr': 0.00038275, 'samples': 294144, 'steps': 1531, 'loss/train': 2.824615478515625} +11/06/2021 21:29:22 - INFO - __main__ - Step 1533: {'lr': 0.00038300000000000004, 'samples': 294336, 'steps': 1532, 'loss/train': 2.8562939167022705} +11/06/2021 21:29:23 - INFO - __main__ - Step 1534: {'lr': 0.00038324999999999996, 'samples': 294528, 'steps': 1533, 'loss/train': 3.2858169078826904} +11/06/2021 21:29:23 - INFO - __main__ - Step 1535: {'lr': 0.0003835, 'samples': 294720, 'steps': 1534, 'loss/train': 3.5091545581817627} +11/06/2021 21:29:24 - INFO - __main__ - Step 1536: {'lr': 0.00038375, 'samples': 294912, 'steps': 1535, 'loss/train': 3.2510337829589844} +11/06/2021 21:29:24 - INFO - __main__ - Step 1537: {'lr': 0.000384, 'samples': 295104, 'steps': 1536, 'loss/train': 3.5380523204803467} +11/06/2021 21:29:24 - INFO - __main__ - Step 1538: {'lr': 0.00038425, 'samples': 295296, 'steps': 1537, 'loss/train': 2.9871280193328857} +11/06/2021 21:29:25 - INFO - __main__ - Step 1539: {'lr': 0.0003845, 'samples': 295488, 'steps': 1538, 'loss/train': 3.5664308071136475} +11/06/2021 21:29:26 - INFO - __main__ - Step 1540: {'lr': 0.00038475, 'samples': 295680, 'steps': 1539, 'loss/train': 3.1113128662109375} +11/06/2021 21:29:26 - INFO - __main__ - Step 1541: {'lr': 0.00038500000000000003, 'samples': 295872, 'steps': 1540, 'loss/train': 4.263197422027588} +11/06/2021 21:29:26 - INFO - __main__ - Step 1542: {'lr': 0.00038525, 'samples': 296064, 'steps': 1541, 'loss/train': 3.313586711883545} +11/06/2021 21:29:27 - INFO - __main__ - Step 1543: {'lr': 0.0003855, 'samples': 296256, 'steps': 1542, 'loss/train': 3.427462100982666} +11/06/2021 21:29:27 - INFO - __main__ - Step 1544: {'lr': 0.00038574999999999997, 'samples': 296448, 'steps': 1543, 'loss/train': 4.165167808532715} +11/06/2021 21:29:28 - INFO - __main__ - Step 1545: {'lr': 0.000386, 'samples': 296640, 'steps': 1544, 'loss/train': 3.6539011001586914} +11/06/2021 21:29:29 - INFO - __main__ - Step 1546: {'lr': 0.00038625, 'samples': 296832, 'steps': 1545, 'loss/train': 3.510122060775757} +11/06/2021 21:29:29 - INFO - __main__ - Step 1547: {'lr': 0.0003865, 'samples': 297024, 'steps': 1546, 'loss/train': 3.2956809997558594} +11/06/2021 21:29:29 - INFO - __main__ - Step 1548: {'lr': 0.00038675, 'samples': 297216, 'steps': 1547, 'loss/train': 3.2712979316711426} +11/06/2021 21:29:30 - INFO - __main__ - Step 1549: {'lr': 0.00038700000000000003, 'samples': 297408, 'steps': 1548, 'loss/train': 2.8422179222106934} +11/06/2021 21:29:31 - INFO - __main__ - Step 1550: {'lr': 0.00038725, 'samples': 297600, 'steps': 1549, 'loss/train': 3.2148244380950928} +11/06/2021 21:29:31 - INFO - __main__ - Step 1551: {'lr': 0.00038750000000000004, 'samples': 297792, 'steps': 1550, 'loss/train': 3.082228422164917} +11/06/2021 21:29:31 - INFO - __main__ - Step 1552: {'lr': 0.00038774999999999997, 'samples': 297984, 'steps': 1551, 'loss/train': 3.0857651233673096} +11/06/2021 21:29:32 - INFO - __main__ - Step 1553: {'lr': 0.000388, 'samples': 298176, 'steps': 1552, 'loss/train': 3.537327289581299} +11/06/2021 21:29:32 - INFO - __main__ - Step 1554: {'lr': 0.00038825, 'samples': 298368, 'steps': 1553, 'loss/train': 3.118391275405884} +11/06/2021 21:29:33 - INFO - __main__ - Step 1555: {'lr': 0.0003885, 'samples': 298560, 'steps': 1554, 'loss/train': 3.2976584434509277} +11/06/2021 21:29:34 - INFO - __main__ - Step 1556: {'lr': 0.00038875, 'samples': 298752, 'steps': 1555, 'loss/train': 3.208622694015503} +11/06/2021 21:29:34 - INFO - __main__ - Step 1557: {'lr': 0.000389, 'samples': 298944, 'steps': 1556, 'loss/train': 2.393932580947876} +11/06/2021 21:29:35 - INFO - __main__ - Step 1558: {'lr': 0.00038925, 'samples': 299136, 'steps': 1557, 'loss/train': 3.1180825233459473} +11/06/2021 21:29:35 - INFO - __main__ - Step 1559: {'lr': 0.00038950000000000003, 'samples': 299328, 'steps': 1558, 'loss/train': 3.363607406616211} +11/06/2021 21:29:35 - INFO - __main__ - Step 1560: {'lr': 0.00038975, 'samples': 299520, 'steps': 1559, 'loss/train': 3.7669551372528076} +11/06/2021 21:29:36 - INFO - __main__ - Step 1561: {'lr': 0.00039000000000000005, 'samples': 299712, 'steps': 1560, 'loss/train': 2.959444284439087} +11/06/2021 21:29:37 - INFO - __main__ - Step 1562: {'lr': 0.00039024999999999997, 'samples': 299904, 'steps': 1561, 'loss/train': 3.453453779220581} +11/06/2021 21:29:37 - INFO - __main__ - Step 1563: {'lr': 0.0003905, 'samples': 300096, 'steps': 1562, 'loss/train': 3.2474799156188965} +11/06/2021 21:29:37 - INFO - __main__ - Step 1564: {'lr': 0.00039075, 'samples': 300288, 'steps': 1563, 'loss/train': 3.6809487342834473} +11/06/2021 21:29:38 - INFO - __main__ - Step 1565: {'lr': 0.000391, 'samples': 300480, 'steps': 1564, 'loss/train': 3.5540361404418945} +11/06/2021 21:29:39 - INFO - __main__ - Step 1566: {'lr': 0.00039125, 'samples': 300672, 'steps': 1565, 'loss/train': 3.8347136974334717} +11/06/2021 21:29:39 - INFO - __main__ - Step 1567: {'lr': 0.00039150000000000003, 'samples': 300864, 'steps': 1566, 'loss/train': 3.0421507358551025} +11/06/2021 21:29:40 - INFO - __main__ - Step 1568: {'lr': 0.00039175, 'samples': 301056, 'steps': 1567, 'loss/train': 2.8751606941223145} +11/06/2021 21:29:40 - INFO - __main__ - Step 1569: {'lr': 0.00039200000000000004, 'samples': 301248, 'steps': 1568, 'loss/train': 2.795197010040283} +11/06/2021 21:29:40 - INFO - __main__ - Step 1570: {'lr': 0.00039225, 'samples': 301440, 'steps': 1569, 'loss/train': 2.370975971221924} +11/06/2021 21:29:41 - INFO - __main__ - Step 1571: {'lr': 0.0003925, 'samples': 301632, 'steps': 1570, 'loss/train': 2.498239040374756} +11/06/2021 21:29:42 - INFO - __main__ - Step 1572: {'lr': 0.00039275, 'samples': 301824, 'steps': 1571, 'loss/train': 1.6988508701324463} +11/06/2021 21:29:42 - INFO - __main__ - Step 1573: {'lr': 0.000393, 'samples': 302016, 'steps': 1572, 'loss/train': 4.021992206573486} +11/06/2021 21:29:42 - INFO - __main__ - Step 1574: {'lr': 0.00039325, 'samples': 302208, 'steps': 1573, 'loss/train': 2.898738145828247} +11/06/2021 21:29:43 - INFO - __main__ - Step 1575: {'lr': 0.0003935, 'samples': 302400, 'steps': 1574, 'loss/train': 2.607938289642334} +11/06/2021 21:29:43 - INFO - __main__ - Step 1576: {'lr': 0.00039375, 'samples': 302592, 'steps': 1575, 'loss/train': 3.263978958129883} +11/06/2021 21:29:44 - INFO - __main__ - Step 1577: {'lr': 0.00039400000000000004, 'samples': 302784, 'steps': 1576, 'loss/train': 2.8440113067626953} +11/06/2021 21:29:44 - INFO - __main__ - Step 1578: {'lr': 0.00039425, 'samples': 302976, 'steps': 1577, 'loss/train': 3.6558189392089844} +11/06/2021 21:29:45 - INFO - __main__ - Step 1579: {'lr': 0.00039450000000000005, 'samples': 303168, 'steps': 1578, 'loss/train': 3.0387959480285645} +11/06/2021 21:29:45 - INFO - __main__ - Step 1580: {'lr': 0.00039474999999999997, 'samples': 303360, 'steps': 1579, 'loss/train': 3.356081008911133} +11/06/2021 21:29:46 - INFO - __main__ - Step 1581: {'lr': 0.000395, 'samples': 303552, 'steps': 1580, 'loss/train': 2.985703706741333} +11/06/2021 21:29:47 - INFO - __main__ - Step 1582: {'lr': 0.00039525, 'samples': 303744, 'steps': 1581, 'loss/train': 3.263591766357422} +11/06/2021 21:29:47 - INFO - __main__ - Step 1583: {'lr': 0.0003955, 'samples': 303936, 'steps': 1582, 'loss/train': 3.0408103466033936} +11/06/2021 21:29:47 - INFO - __main__ - Step 1584: {'lr': 0.00039575, 'samples': 304128, 'steps': 1583, 'loss/train': 3.310321807861328} +11/06/2021 21:29:48 - INFO - __main__ - Step 1585: {'lr': 0.00039600000000000003, 'samples': 304320, 'steps': 1584, 'loss/train': 2.9202144145965576} +11/06/2021 21:29:48 - INFO - __main__ - Step 1586: {'lr': 0.00039625, 'samples': 304512, 'steps': 1585, 'loss/train': 3.2440686225891113} +11/06/2021 21:29:49 - INFO - __main__ - Step 1587: {'lr': 0.00039650000000000004, 'samples': 304704, 'steps': 1586, 'loss/train': 3.232225179672241} +11/06/2021 21:29:49 - INFO - __main__ - Step 1588: {'lr': 0.00039675, 'samples': 304896, 'steps': 1587, 'loss/train': 3.2099974155426025} +11/06/2021 21:29:50 - INFO - __main__ - Step 1589: {'lr': 0.00039700000000000005, 'samples': 305088, 'steps': 1588, 'loss/train': 2.729403018951416} +11/06/2021 21:29:50 - INFO - __main__ - Step 1590: {'lr': 0.00039725, 'samples': 305280, 'steps': 1589, 'loss/train': 2.7173776626586914} +11/06/2021 21:29:50 - INFO - __main__ - Step 1591: {'lr': 0.0003975, 'samples': 305472, 'steps': 1590, 'loss/train': 3.206320285797119} +11/06/2021 21:29:51 - INFO - __main__ - Step 1592: {'lr': 0.00039775, 'samples': 305664, 'steps': 1591, 'loss/train': 2.313783884048462} +11/06/2021 21:29:52 - INFO - __main__ - Step 1593: {'lr': 0.000398, 'samples': 305856, 'steps': 1592, 'loss/train': 3.254606008529663} +11/06/2021 21:29:52 - INFO - __main__ - Step 1594: {'lr': 0.00039825, 'samples': 306048, 'steps': 1593, 'loss/train': 3.374396324157715} +11/06/2021 21:29:52 - INFO - __main__ - Step 1595: {'lr': 0.00039850000000000004, 'samples': 306240, 'steps': 1594, 'loss/train': 3.533506155014038} +11/06/2021 21:29:53 - INFO - __main__ - Step 1596: {'lr': 0.00039875, 'samples': 306432, 'steps': 1595, 'loss/train': 2.543515205383301} +11/06/2021 21:29:54 - INFO - __main__ - Step 1597: {'lr': 0.00039900000000000005, 'samples': 306624, 'steps': 1596, 'loss/train': 2.980104684829712} +11/06/2021 21:29:54 - INFO - __main__ - Step 1598: {'lr': 0.00039925000000000003, 'samples': 306816, 'steps': 1597, 'loss/train': 2.649993896484375} +11/06/2021 21:29:55 - INFO - __main__ - Step 1599: {'lr': 0.0003995, 'samples': 307008, 'steps': 1598, 'loss/train': 2.8795385360717773} +11/06/2021 21:29:55 - INFO - __main__ - Step 1600: {'lr': 0.00039975, 'samples': 307200, 'steps': 1599, 'loss/train': 3.1416678428649902} +11/06/2021 21:29:55 - INFO - __main__ - Step 1601: {'lr': 0.0004, 'samples': 307392, 'steps': 1600, 'loss/train': 2.955704689025879} +11/06/2021 21:29:56 - INFO - __main__ - Step 1602: {'lr': 0.00040025, 'samples': 307584, 'steps': 1601, 'loss/train': 3.7033560276031494} +11/06/2021 21:29:57 - INFO - __main__ - Step 1603: {'lr': 0.00040050000000000003, 'samples': 307776, 'steps': 1602, 'loss/train': 2.7389466762542725} +11/06/2021 21:29:57 - INFO - __main__ - Step 1604: {'lr': 0.00040075, 'samples': 307968, 'steps': 1603, 'loss/train': 3.5183396339416504} +11/06/2021 21:29:58 - INFO - __main__ - Step 1605: {'lr': 0.00040100000000000004, 'samples': 308160, 'steps': 1604, 'loss/train': 3.134627103805542} +11/06/2021 21:29:58 - INFO - __main__ - Step 1606: {'lr': 0.00040125, 'samples': 308352, 'steps': 1605, 'loss/train': 2.952859878540039} +11/06/2021 21:29:58 - INFO - __main__ - Step 1607: {'lr': 0.00040150000000000006, 'samples': 308544, 'steps': 1606, 'loss/train': 3.224421977996826} +11/06/2021 21:29:59 - INFO - __main__ - Step 1608: {'lr': 0.00040175, 'samples': 308736, 'steps': 1607, 'loss/train': 2.4461114406585693} +11/06/2021 21:30:00 - INFO - __main__ - Step 1609: {'lr': 0.000402, 'samples': 308928, 'steps': 1608, 'loss/train': 3.342259645462036} +11/06/2021 21:30:00 - INFO - __main__ - Step 1610: {'lr': 0.00040225, 'samples': 309120, 'steps': 1609, 'loss/train': 3.2026968002319336} +11/06/2021 21:30:00 - INFO - __main__ - Step 1611: {'lr': 0.0004025, 'samples': 309312, 'steps': 1610, 'loss/train': 3.4691827297210693} +11/06/2021 21:30:01 - INFO - __main__ - Step 1612: {'lr': 0.00040275, 'samples': 309504, 'steps': 1611, 'loss/train': 3.279484987258911} +11/06/2021 21:30:02 - INFO - __main__ - Step 1613: {'lr': 0.00040300000000000004, 'samples': 309696, 'steps': 1612, 'loss/train': 3.016733407974243} +11/06/2021 21:30:02 - INFO - __main__ - Step 1614: {'lr': 0.00040325, 'samples': 309888, 'steps': 1613, 'loss/train': 3.192936897277832} +11/06/2021 21:30:02 - INFO - __main__ - Step 1615: {'lr': 0.00040350000000000005, 'samples': 310080, 'steps': 1614, 'loss/train': 3.0827951431274414} +11/06/2021 21:30:03 - INFO - __main__ - Step 1616: {'lr': 0.00040375000000000003, 'samples': 310272, 'steps': 1615, 'loss/train': 2.6593739986419678} +11/06/2021 21:30:03 - INFO - __main__ - Step 1617: {'lr': 0.000404, 'samples': 310464, 'steps': 1616, 'loss/train': 2.6806726455688477} +11/06/2021 21:30:04 - INFO - __main__ - Step 1618: {'lr': 0.00040425, 'samples': 310656, 'steps': 1617, 'loss/train': 2.476854085922241} +11/06/2021 21:30:04 - INFO - __main__ - Step 1619: {'lr': 0.0004045, 'samples': 310848, 'steps': 1618, 'loss/train': 3.110135793685913} +11/06/2021 21:30:05 - INFO - __main__ - Step 1620: {'lr': 0.00040475, 'samples': 311040, 'steps': 1619, 'loss/train': 2.908262014389038} +11/06/2021 21:30:05 - INFO - __main__ - Step 1621: {'lr': 0.00040500000000000003, 'samples': 311232, 'steps': 1620, 'loss/train': 3.027345657348633} +11/06/2021 21:30:05 - INFO - __main__ - Step 1622: {'lr': 0.00040525, 'samples': 311424, 'steps': 1621, 'loss/train': 3.2688331604003906} +11/06/2021 21:30:07 - INFO - __main__ - Step 1623: {'lr': 0.00040550000000000004, 'samples': 311616, 'steps': 1622, 'loss/train': 2.6070456504821777} +11/06/2021 21:30:07 - INFO - __main__ - Step 1624: {'lr': 0.00040575, 'samples': 311808, 'steps': 1623, 'loss/train': 3.40415620803833} +11/06/2021 21:30:07 - INFO - __main__ - Step 1625: {'lr': 0.00040600000000000006, 'samples': 312000, 'steps': 1624, 'loss/train': 3.013209819793701} +11/06/2021 21:30:08 - INFO - __main__ - Step 1626: {'lr': 0.00040625000000000004, 'samples': 312192, 'steps': 1625, 'loss/train': 2.7747411727905273} +11/06/2021 21:30:08 - INFO - __main__ - Step 1627: {'lr': 0.00040649999999999996, 'samples': 312384, 'steps': 1626, 'loss/train': 2.614873170852661} +11/06/2021 21:30:09 - INFO - __main__ - Step 1628: {'lr': 0.00040675, 'samples': 312576, 'steps': 1627, 'loss/train': 2.9833312034606934} +11/06/2021 21:30:09 - INFO - __main__ - Step 1629: {'lr': 0.00040699999999999997, 'samples': 312768, 'steps': 1628, 'loss/train': 3.6013989448547363} +11/06/2021 21:30:10 - INFO - __main__ - Step 1630: {'lr': 0.00040725, 'samples': 312960, 'steps': 1629, 'loss/train': 3.32792067527771} +11/06/2021 21:30:10 - INFO - __main__ - Step 1631: {'lr': 0.0004075, 'samples': 313152, 'steps': 1630, 'loss/train': 2.2372703552246094} +11/06/2021 21:30:10 - INFO - __main__ - Step 1632: {'lr': 0.00040775, 'samples': 313344, 'steps': 1631, 'loss/train': 3.2227723598480225} +11/06/2021 21:30:11 - INFO - __main__ - Step 1633: {'lr': 0.000408, 'samples': 313536, 'steps': 1632, 'loss/train': 2.9736287593841553} +11/06/2021 21:30:12 - INFO - __main__ - Step 1634: {'lr': 0.00040825000000000003, 'samples': 313728, 'steps': 1633, 'loss/train': 3.227055072784424} +11/06/2021 21:30:12 - INFO - __main__ - Step 1635: {'lr': 0.0004085, 'samples': 313920, 'steps': 1634, 'loss/train': 4.195490837097168} +11/06/2021 21:30:13 - INFO - __main__ - Step 1636: {'lr': 0.00040875, 'samples': 314112, 'steps': 1635, 'loss/train': 2.5357518196105957} +11/06/2021 21:30:13 - INFO - __main__ - Step 1637: {'lr': 0.00040899999999999997, 'samples': 314304, 'steps': 1636, 'loss/train': 3.0355074405670166} +11/06/2021 21:30:13 - INFO - __main__ - Step 1638: {'lr': 0.00040925, 'samples': 314496, 'steps': 1637, 'loss/train': 3.301243305206299} +11/06/2021 21:30:14 - INFO - __main__ - Step 1639: {'lr': 0.0004095, 'samples': 314688, 'steps': 1638, 'loss/train': 3.4538841247558594} +11/06/2021 21:30:15 - INFO - __main__ - Step 1640: {'lr': 0.00040975, 'samples': 314880, 'steps': 1639, 'loss/train': 3.0793862342834473} +11/06/2021 21:30:15 - INFO - __main__ - Step 1641: {'lr': 0.00041, 'samples': 315072, 'steps': 1640, 'loss/train': 3.042006492614746} +11/06/2021 21:30:15 - INFO - __main__ - Step 1642: {'lr': 0.00041025, 'samples': 315264, 'steps': 1641, 'loss/train': 2.085822105407715} +11/06/2021 21:30:16 - INFO - __main__ - Step 1643: {'lr': 0.0004105, 'samples': 315456, 'steps': 1642, 'loss/train': 3.430644989013672} +11/06/2021 21:30:17 - INFO - __main__ - Step 1644: {'lr': 0.00041075000000000004, 'samples': 315648, 'steps': 1643, 'loss/train': 2.801948308944702} +11/06/2021 21:30:17 - INFO - __main__ - Step 1645: {'lr': 0.00041099999999999996, 'samples': 315840, 'steps': 1644, 'loss/train': 2.5270915031433105} +11/06/2021 21:30:18 - INFO - __main__ - Step 1646: {'lr': 0.00041125, 'samples': 316032, 'steps': 1645, 'loss/train': 2.423734188079834} +11/06/2021 21:30:18 - INFO - __main__ - Step 1647: {'lr': 0.0004115, 'samples': 316224, 'steps': 1646, 'loss/train': 3.113656520843506} +11/06/2021 21:30:18 - INFO - __main__ - Step 1648: {'lr': 0.00041175, 'samples': 316416, 'steps': 1647, 'loss/train': 3.738720655441284} +11/06/2021 21:30:19 - INFO - __main__ - Step 1649: {'lr': 0.000412, 'samples': 316608, 'steps': 1648, 'loss/train': 3.3871734142303467} +11/06/2021 21:30:20 - INFO - __main__ - Step 1650: {'lr': 0.00041225, 'samples': 316800, 'steps': 1649, 'loss/train': 3.1259071826934814} +11/06/2021 21:30:20 - INFO - __main__ - Step 1651: {'lr': 0.0004125, 'samples': 316992, 'steps': 1650, 'loss/train': 2.9349560737609863} +11/06/2021 21:30:21 - INFO - __main__ - Step 1652: {'lr': 0.00041275000000000003, 'samples': 317184, 'steps': 1651, 'loss/train': 2.337951183319092} +11/06/2021 21:30:21 - INFO - __main__ - Step 1653: {'lr': 0.000413, 'samples': 317376, 'steps': 1652, 'loss/train': 3.269364595413208} +11/06/2021 21:30:21 - INFO - __main__ - Step 1654: {'lr': 0.00041325, 'samples': 317568, 'steps': 1653, 'loss/train': 2.937201499938965} +11/06/2021 21:30:22 - INFO - __main__ - Step 1655: {'lr': 0.00041349999999999997, 'samples': 317760, 'steps': 1654, 'loss/train': 3.1462650299072266} +11/06/2021 21:30:23 - INFO - __main__ - Step 1656: {'lr': 0.00041375, 'samples': 317952, 'steps': 1655, 'loss/train': 3.218020439147949} +11/06/2021 21:30:23 - INFO - __main__ - Step 1657: {'lr': 0.000414, 'samples': 318144, 'steps': 1656, 'loss/train': 2.919787645339966} +11/06/2021 21:30:23 - INFO - __main__ - Step 1658: {'lr': 0.00041425, 'samples': 318336, 'steps': 1657, 'loss/train': 2.882232666015625} +11/06/2021 21:30:24 - INFO - __main__ - Step 1659: {'lr': 0.0004145, 'samples': 318528, 'steps': 1658, 'loss/train': 3.018845558166504} +11/06/2021 21:30:24 - INFO - __main__ - Step 1660: {'lr': 0.00041475, 'samples': 318720, 'steps': 1659, 'loss/train': 3.1834557056427} +11/06/2021 21:30:25 - INFO - __main__ - Step 1661: {'lr': 0.000415, 'samples': 318912, 'steps': 1660, 'loss/train': 2.9305548667907715} +11/06/2021 21:30:26 - INFO - __main__ - Step 1662: {'lr': 0.00041525000000000004, 'samples': 319104, 'steps': 1661, 'loss/train': 2.6207032203674316} +11/06/2021 21:30:26 - INFO - __main__ - Step 1663: {'lr': 0.00041549999999999996, 'samples': 319296, 'steps': 1662, 'loss/train': 2.4517478942871094} +11/06/2021 21:30:26 - INFO - __main__ - Step 1664: {'lr': 0.00041575, 'samples': 319488, 'steps': 1663, 'loss/train': 3.7537591457366943} +11/06/2021 21:30:27 - INFO - __main__ - Step 1665: {'lr': 0.000416, 'samples': 319680, 'steps': 1664, 'loss/train': 2.756814956665039} +11/06/2021 21:30:28 - INFO - __main__ - Step 1666: {'lr': 0.00041625, 'samples': 319872, 'steps': 1665, 'loss/train': 1.4056485891342163} +11/06/2021 21:30:28 - INFO - __main__ - Step 1667: {'lr': 0.0004165, 'samples': 320064, 'steps': 1666, 'loss/train': 3.1112024784088135} +11/06/2021 21:30:29 - INFO - __main__ - Step 1668: {'lr': 0.00041675, 'samples': 320256, 'steps': 1667, 'loss/train': 2.9976048469543457} +11/06/2021 21:30:29 - INFO - __main__ - Step 1669: {'lr': 0.000417, 'samples': 320448, 'steps': 1668, 'loss/train': 2.675729274749756} +11/06/2021 21:30:29 - INFO - __main__ - Step 1670: {'lr': 0.00041725000000000003, 'samples': 320640, 'steps': 1669, 'loss/train': 3.3706750869750977} +11/06/2021 21:30:30 - INFO - __main__ - Step 1671: {'lr': 0.0004175, 'samples': 320832, 'steps': 1670, 'loss/train': 2.178697109222412} +11/06/2021 21:30:31 - INFO - __main__ - Step 1672: {'lr': 0.00041775000000000004, 'samples': 321024, 'steps': 1671, 'loss/train': 3.380084753036499} +11/06/2021 21:30:31 - INFO - __main__ - Step 1673: {'lr': 0.00041799999999999997, 'samples': 321216, 'steps': 1672, 'loss/train': 3.366750717163086} +11/06/2021 21:30:31 - INFO - __main__ - Step 1674: {'lr': 0.00041825, 'samples': 321408, 'steps': 1673, 'loss/train': 3.209273338317871} +11/06/2021 21:30:32 - INFO - __main__ - Step 1675: {'lr': 0.0004185, 'samples': 321600, 'steps': 1674, 'loss/train': 2.97452449798584} +11/06/2021 21:30:32 - INFO - __main__ - Step 1676: {'lr': 0.00041875, 'samples': 321792, 'steps': 1675, 'loss/train': 2.767279863357544} +11/06/2021 21:30:33 - INFO - __main__ - Step 1677: {'lr': 0.000419, 'samples': 321984, 'steps': 1676, 'loss/train': 2.001840114593506} +11/06/2021 21:30:34 - INFO - __main__ - Step 1678: {'lr': 0.00041925, 'samples': 322176, 'steps': 1677, 'loss/train': 2.869393825531006} +11/06/2021 21:30:34 - INFO - __main__ - Step 1679: {'lr': 0.0004195, 'samples': 322368, 'steps': 1678, 'loss/train': 3.0054664611816406} +11/06/2021 21:30:34 - INFO - __main__ - Step 1680: {'lr': 0.00041975000000000004, 'samples': 322560, 'steps': 1679, 'loss/train': 3.0030410289764404} +11/06/2021 21:30:35 - INFO - __main__ - Step 1681: {'lr': 0.00042, 'samples': 322752, 'steps': 1680, 'loss/train': 3.1293513774871826} +11/06/2021 21:30:36 - INFO - __main__ - Step 1682: {'lr': 0.00042025, 'samples': 322944, 'steps': 1681, 'loss/train': 2.867621421813965} +11/06/2021 21:30:36 - INFO - __main__ - Step 1683: {'lr': 0.0004205, 'samples': 323136, 'steps': 1682, 'loss/train': 3.148564100265503} +11/06/2021 21:30:36 - INFO - __main__ - Step 1684: {'lr': 0.00042075, 'samples': 323328, 'steps': 1683, 'loss/train': 3.7352867126464844} +11/06/2021 21:30:37 - INFO - __main__ - Step 1685: {'lr': 0.000421, 'samples': 323520, 'steps': 1684, 'loss/train': 2.9373221397399902} +11/06/2021 21:30:37 - INFO - __main__ - Step 1686: {'lr': 0.00042125, 'samples': 323712, 'steps': 1685, 'loss/train': 3.0616962909698486} +11/06/2021 21:30:38 - INFO - __main__ - Step 1687: {'lr': 0.0004215, 'samples': 323904, 'steps': 1686, 'loss/train': 3.012714147567749} +11/06/2021 21:30:38 - INFO - __main__ - Step 1688: {'lr': 0.00042175000000000003, 'samples': 324096, 'steps': 1687, 'loss/train': 2.1148290634155273} +11/06/2021 21:30:39 - INFO - __main__ - Step 1689: {'lr': 0.000422, 'samples': 324288, 'steps': 1688, 'loss/train': 2.7919063568115234} +11/06/2021 21:30:39 - INFO - __main__ - Step 1690: {'lr': 0.00042225000000000005, 'samples': 324480, 'steps': 1689, 'loss/train': 2.9707889556884766} +11/06/2021 21:30:39 - INFO - __main__ - Step 1691: {'lr': 0.00042249999999999997, 'samples': 324672, 'steps': 1690, 'loss/train': 2.998028039932251} +11/06/2021 21:30:40 - INFO - __main__ - Step 1692: {'lr': 0.00042275, 'samples': 324864, 'steps': 1691, 'loss/train': 2.591597557067871} +11/06/2021 21:30:41 - INFO - __main__ - Step 1693: {'lr': 0.000423, 'samples': 325056, 'steps': 1692, 'loss/train': 1.9363735914230347} +11/06/2021 21:30:41 - INFO - __main__ - Step 1694: {'lr': 0.00042325, 'samples': 325248, 'steps': 1693, 'loss/train': 4.028586387634277} +11/06/2021 21:30:42 - INFO - __main__ - Step 1695: {'lr': 0.0004235, 'samples': 325440, 'steps': 1694, 'loss/train': 2.9330668449401855} +11/06/2021 21:30:42 - INFO - __main__ - Step 1696: {'lr': 0.00042375000000000003, 'samples': 325632, 'steps': 1695, 'loss/train': 2.7509193420410156} +11/06/2021 21:30:42 - INFO - __main__ - Step 1697: {'lr': 0.000424, 'samples': 325824, 'steps': 1696, 'loss/train': 2.7954797744750977} +11/06/2021 21:30:44 - INFO - __main__ - Step 1698: {'lr': 0.00042425000000000004, 'samples': 326016, 'steps': 1697, 'loss/train': 2.988008499145508} +11/06/2021 21:30:44 - INFO - __main__ - Step 1699: {'lr': 0.0004245, 'samples': 326208, 'steps': 1698, 'loss/train': 1.511644959449768} +11/06/2021 21:30:44 - INFO - __main__ - Step 1700: {'lr': 0.00042475000000000005, 'samples': 326400, 'steps': 1699, 'loss/train': 2.778535842895508} +11/06/2021 21:30:45 - INFO - __main__ - Step 1701: {'lr': 0.000425, 'samples': 326592, 'steps': 1700, 'loss/train': 3.4467451572418213} +11/06/2021 21:30:45 - INFO - __main__ - Step 1702: {'lr': 0.00042525, 'samples': 326784, 'steps': 1701, 'loss/train': 2.888021469116211} +11/06/2021 21:30:46 - INFO - __main__ - Step 1703: {'lr': 0.0004255, 'samples': 326976, 'steps': 1702, 'loss/train': 3.509974718093872} +11/06/2021 21:30:46 - INFO - __main__ - Step 1704: {'lr': 0.00042575, 'samples': 327168, 'steps': 1703, 'loss/train': 3.2961580753326416} +11/06/2021 21:30:47 - INFO - __main__ - Step 1705: {'lr': 0.000426, 'samples': 327360, 'steps': 1704, 'loss/train': 2.881072521209717} +11/06/2021 21:30:47 - INFO - __main__ - Step 1706: {'lr': 0.00042625000000000003, 'samples': 327552, 'steps': 1705, 'loss/train': 2.8724474906921387} +11/06/2021 21:30:48 - INFO - __main__ - Step 1707: {'lr': 0.0004265, 'samples': 327744, 'steps': 1706, 'loss/train': 2.812833547592163} +11/06/2021 21:30:49 - INFO - __main__ - Step 1708: {'lr': 0.00042675000000000005, 'samples': 327936, 'steps': 1707, 'loss/train': 2.946378231048584} +11/06/2021 21:30:49 - INFO - __main__ - Step 1709: {'lr': 0.000427, 'samples': 328128, 'steps': 1708, 'loss/train': 3.0991225242614746} +11/06/2021 21:30:49 - INFO - __main__ - Step 1710: {'lr': 0.00042725, 'samples': 328320, 'steps': 1709, 'loss/train': 2.76066517829895} +11/06/2021 21:30:50 - INFO - __main__ - Step 1711: {'lr': 0.0004275, 'samples': 328512, 'steps': 1710, 'loss/train': 3.4125115871429443} +11/06/2021 21:30:50 - INFO - __main__ - Step 1712: {'lr': 0.00042775, 'samples': 328704, 'steps': 1711, 'loss/train': 3.148629903793335} +11/06/2021 21:30:51 - INFO - __main__ - Step 1713: {'lr': 0.000428, 'samples': 328896, 'steps': 1712, 'loss/train': 2.9542479515075684} +11/06/2021 21:30:51 - INFO - __main__ - Step 1714: {'lr': 0.00042825000000000003, 'samples': 329088, 'steps': 1713, 'loss/train': 2.862802743911743} +11/06/2021 21:30:52 - INFO - __main__ - Step 1715: {'lr': 0.0004285, 'samples': 329280, 'steps': 1714, 'loss/train': 3.073770046234131} +11/06/2021 21:30:52 - INFO - __main__ - Step 1716: {'lr': 0.00042875000000000004, 'samples': 329472, 'steps': 1715, 'loss/train': 3.261838436126709} +11/06/2021 21:30:52 - INFO - __main__ - Step 1717: {'lr': 0.000429, 'samples': 329664, 'steps': 1716, 'loss/train': 2.599968194961548} +11/06/2021 21:30:53 - INFO - __main__ - Step 1718: {'lr': 0.00042925000000000005, 'samples': 329856, 'steps': 1717, 'loss/train': 2.516638994216919} +11/06/2021 21:30:54 - INFO - __main__ - Step 1719: {'lr': 0.0004295, 'samples': 330048, 'steps': 1718, 'loss/train': 3.0501821041107178} +11/06/2021 21:30:54 - INFO - __main__ - Step 1720: {'lr': 0.00042975, 'samples': 330240, 'steps': 1719, 'loss/train': 2.847111225128174} +11/06/2021 21:30:55 - INFO - __main__ - Step 1721: {'lr': 0.00043, 'samples': 330432, 'steps': 1720, 'loss/train': 3.3006772994995117} +11/06/2021 21:30:55 - INFO - __main__ - Step 1722: {'lr': 0.00043025, 'samples': 330624, 'steps': 1721, 'loss/train': 2.7652220726013184} +11/06/2021 21:30:55 - INFO - __main__ - Step 1723: {'lr': 0.0004305, 'samples': 330816, 'steps': 1722, 'loss/train': 2.9833667278289795} +11/06/2021 21:30:56 - INFO - __main__ - Step 1724: {'lr': 0.00043075000000000003, 'samples': 331008, 'steps': 1723, 'loss/train': 2.814836263656616} +11/06/2021 21:30:57 - INFO - __main__ - Step 1725: {'lr': 0.000431, 'samples': 331200, 'steps': 1724, 'loss/train': 2.774881601333618} +11/06/2021 21:30:57 - INFO - __main__ - Step 1726: {'lr': 0.00043125000000000005, 'samples': 331392, 'steps': 1725, 'loss/train': 2.4785728454589844} +11/06/2021 21:30:57 - INFO - __main__ - Step 1727: {'lr': 0.0004315, 'samples': 331584, 'steps': 1726, 'loss/train': 2.6767044067382812} +11/06/2021 21:30:58 - INFO - __main__ - Step 1728: {'lr': 0.00043175, 'samples': 331776, 'steps': 1727, 'loss/train': 2.493360757827759} +11/06/2021 21:30:59 - INFO - __main__ - Step 1729: {'lr': 0.000432, 'samples': 331968, 'steps': 1728, 'loss/train': 2.8869781494140625} +11/06/2021 21:30:59 - INFO - __main__ - Step 1730: {'lr': 0.00043225, 'samples': 332160, 'steps': 1729, 'loss/train': 3.2163848876953125} +11/06/2021 21:30:59 - INFO - __main__ - Step 1731: {'lr': 0.0004325, 'samples': 332352, 'steps': 1730, 'loss/train': 2.487175703048706} +11/06/2021 21:31:00 - INFO - __main__ - Step 1732: {'lr': 0.00043275000000000003, 'samples': 332544, 'steps': 1731, 'loss/train': 3.1521098613739014} +11/06/2021 21:31:00 - INFO - __main__ - Step 1733: {'lr': 0.000433, 'samples': 332736, 'steps': 1732, 'loss/train': 2.8074662685394287} +11/06/2021 21:31:01 - INFO - __main__ - Step 1734: {'lr': 0.00043325000000000004, 'samples': 332928, 'steps': 1733, 'loss/train': 3.05580735206604} +11/06/2021 21:31:01 - INFO - __main__ - Step 1735: {'lr': 0.0004335, 'samples': 333120, 'steps': 1734, 'loss/train': 3.6109087467193604} +11/06/2021 21:31:02 - INFO - __main__ - Step 1736: {'lr': 0.00043375000000000005, 'samples': 333312, 'steps': 1735, 'loss/train': 2.645113945007324} +11/06/2021 21:31:02 - INFO - __main__ - Step 1737: {'lr': 0.00043400000000000003, 'samples': 333504, 'steps': 1736, 'loss/train': 3.2458112239837646} +11/06/2021 21:31:02 - INFO - __main__ - Step 1738: {'lr': 0.00043425, 'samples': 333696, 'steps': 1737, 'loss/train': 2.0575199127197266} +11/06/2021 21:31:03 - INFO - __main__ - Step 1739: {'lr': 0.0004345, 'samples': 333888, 'steps': 1738, 'loss/train': 2.66829514503479} +11/06/2021 21:31:04 - INFO - __main__ - Step 1740: {'lr': 0.00043475, 'samples': 334080, 'steps': 1739, 'loss/train': 2.9333367347717285} +11/06/2021 21:31:04 - INFO - __main__ - Step 1741: {'lr': 0.000435, 'samples': 334272, 'steps': 1740, 'loss/train': 3.1755714416503906} +11/06/2021 21:31:04 - INFO - __main__ - Step 1742: {'lr': 0.00043525000000000004, 'samples': 334464, 'steps': 1741, 'loss/train': 3.1603219509124756} +11/06/2021 21:31:05 - INFO - __main__ - Step 1743: {'lr': 0.0004355, 'samples': 334656, 'steps': 1742, 'loss/train': 2.6941590309143066} +11/06/2021 21:31:05 - INFO - __main__ - Step 1744: {'lr': 0.00043575000000000005, 'samples': 334848, 'steps': 1743, 'loss/train': 2.652301788330078} +11/06/2021 21:31:06 - INFO - __main__ - Step 1745: {'lr': 0.000436, 'samples': 335040, 'steps': 1744, 'loss/train': 2.9104788303375244} +11/06/2021 21:31:06 - INFO - __main__ - Step 1746: {'lr': 0.00043625000000000006, 'samples': 335232, 'steps': 1745, 'loss/train': 2.98048996925354} +11/06/2021 21:31:07 - INFO - __main__ - Step 1747: {'lr': 0.0004365, 'samples': 335424, 'steps': 1746, 'loss/train': 2.9957258701324463} +11/06/2021 21:31:07 - INFO - __main__ - Step 1748: {'lr': 0.00043675, 'samples': 335616, 'steps': 1747, 'loss/train': 2.979066848754883} +11/06/2021 21:31:08 - INFO - __main__ - Step 1749: {'lr': 0.000437, 'samples': 335808, 'steps': 1748, 'loss/train': 2.8784215450286865} +11/06/2021 21:31:09 - INFO - __main__ - Step 1750: {'lr': 0.00043725000000000003, 'samples': 336000, 'steps': 1749, 'loss/train': 2.7070152759552} +11/06/2021 21:31:09 - INFO - __main__ - Step 1751: {'lr': 0.0004375, 'samples': 336192, 'steps': 1750, 'loss/train': 3.0066816806793213} +11/06/2021 21:31:09 - INFO - __main__ - Step 1752: {'lr': 0.00043775, 'samples': 336384, 'steps': 1751, 'loss/train': 2.9297680854797363} +11/06/2021 21:31:10 - INFO - __main__ - Step 1753: {'lr': 0.000438, 'samples': 336576, 'steps': 1752, 'loss/train': 2.3090498447418213} +11/06/2021 21:31:10 - INFO - __main__ - Step 1754: {'lr': 0.00043825, 'samples': 336768, 'steps': 1753, 'loss/train': 2.7136483192443848} +11/06/2021 21:31:11 - INFO - __main__ - Step 1755: {'lr': 0.00043850000000000003, 'samples': 336960, 'steps': 1754, 'loss/train': 2.4475595951080322} +11/06/2021 21:31:11 - INFO - __main__ - Step 1756: {'lr': 0.00043874999999999996, 'samples': 337152, 'steps': 1755, 'loss/train': 2.8239781856536865} +11/06/2021 21:31:12 - INFO - __main__ - Step 1757: {'lr': 0.000439, 'samples': 337344, 'steps': 1756, 'loss/train': 3.583254337310791} +11/06/2021 21:31:12 - INFO - __main__ - Step 1758: {'lr': 0.00043924999999999997, 'samples': 337536, 'steps': 1757, 'loss/train': 2.8755791187286377} +11/06/2021 21:31:12 - INFO - __main__ - Step 1759: {'lr': 0.0004395, 'samples': 337728, 'steps': 1758, 'loss/train': 2.466693878173828} +11/06/2021 21:31:14 - INFO - __main__ - Step 1760: {'lr': 0.00043975, 'samples': 337920, 'steps': 1759, 'loss/train': 1.9713040590286255} +11/06/2021 21:31:14 - INFO - __main__ - Step 1761: {'lr': 0.00044, 'samples': 338112, 'steps': 1760, 'loss/train': 2.958988904953003} +11/06/2021 21:31:14 - INFO - __main__ - Step 1762: {'lr': 0.00044025, 'samples': 338304, 'steps': 1761, 'loss/train': 2.85742449760437} +11/06/2021 21:31:15 - INFO - __main__ - Step 1763: {'lr': 0.00044050000000000003, 'samples': 338496, 'steps': 1762, 'loss/train': 3.1893415451049805} +11/06/2021 21:31:15 - INFO - __main__ - Step 1764: {'lr': 0.00044075, 'samples': 338688, 'steps': 1763, 'loss/train': 2.489380121231079} +11/06/2021 21:31:16 - INFO - __main__ - Step 1765: {'lr': 0.000441, 'samples': 338880, 'steps': 1764, 'loss/train': 2.26016902923584} +11/06/2021 21:31:16 - INFO - __main__ - Step 1766: {'lr': 0.00044124999999999996, 'samples': 339072, 'steps': 1765, 'loss/train': 2.8823275566101074} +11/06/2021 21:31:17 - INFO - __main__ - Step 1767: {'lr': 0.0004415, 'samples': 339264, 'steps': 1766, 'loss/train': 3.0336639881134033} +11/06/2021 21:31:17 - INFO - __main__ - Step 1768: {'lr': 0.00044175, 'samples': 339456, 'steps': 1767, 'loss/train': 2.4429008960723877} +11/06/2021 21:31:17 - INFO - __main__ - Step 1769: {'lr': 0.000442, 'samples': 339648, 'steps': 1768, 'loss/train': 3.196798086166382} +11/06/2021 21:31:18 - INFO - __main__ - Step 1770: {'lr': 0.00044225, 'samples': 339840, 'steps': 1769, 'loss/train': 3.4543304443359375} +11/06/2021 21:31:19 - INFO - __main__ - Step 1771: {'lr': 0.0004425, 'samples': 340032, 'steps': 1770, 'loss/train': 2.851696252822876} +11/06/2021 21:31:19 - INFO - __main__ - Step 1772: {'lr': 0.00044275, 'samples': 340224, 'steps': 1771, 'loss/train': 3.060702085494995} +11/06/2021 21:31:19 - INFO - __main__ - Step 1773: {'lr': 0.00044300000000000003, 'samples': 340416, 'steps': 1772, 'loss/train': 2.7474842071533203} +11/06/2021 21:31:20 - INFO - __main__ - Step 1774: {'lr': 0.00044325, 'samples': 340608, 'steps': 1773, 'loss/train': 2.9190454483032227} +11/06/2021 21:31:21 - INFO - __main__ - Step 1775: {'lr': 0.0004435, 'samples': 340800, 'steps': 1774, 'loss/train': 2.802793025970459} +11/06/2021 21:31:21 - INFO - __main__ - Step 1776: {'lr': 0.00044374999999999997, 'samples': 340992, 'steps': 1775, 'loss/train': 2.8785560131073} +11/06/2021 21:31:21 - INFO - __main__ - Step 1777: {'lr': 0.000444, 'samples': 341184, 'steps': 1776, 'loss/train': 2.995643138885498} +11/06/2021 21:31:22 - INFO - __main__ - Step 1778: {'lr': 0.00044425, 'samples': 341376, 'steps': 1777, 'loss/train': 1.8993228673934937} +11/06/2021 21:31:22 - INFO - __main__ - Step 1779: {'lr': 0.0004445, 'samples': 341568, 'steps': 1778, 'loss/train': 2.85463547706604} +11/06/2021 21:31:23 - INFO - __main__ - Step 1780: {'lr': 0.00044475, 'samples': 341760, 'steps': 1779, 'loss/train': 2.185767650604248} +11/06/2021 21:31:24 - INFO - __main__ - Step 1781: {'lr': 0.00044500000000000003, 'samples': 341952, 'steps': 1780, 'loss/train': 2.92201828956604} +11/06/2021 21:31:24 - INFO - __main__ - Step 1782: {'lr': 0.00044525, 'samples': 342144, 'steps': 1781, 'loss/train': 3.134248971939087} +11/06/2021 21:31:24 - INFO - __main__ - Step 1783: {'lr': 0.00044550000000000004, 'samples': 342336, 'steps': 1782, 'loss/train': 2.170048952102661} +11/06/2021 21:31:25 - INFO - __main__ - Step 1784: {'lr': 0.00044574999999999997, 'samples': 342528, 'steps': 1783, 'loss/train': 3.8918814659118652} +11/06/2021 21:31:26 - INFO - __main__ - Step 1785: {'lr': 0.000446, 'samples': 342720, 'steps': 1784, 'loss/train': 2.8046724796295166} +11/06/2021 21:31:26 - INFO - __main__ - Step 1786: {'lr': 0.00044625, 'samples': 342912, 'steps': 1785, 'loss/train': 1.7093374729156494} +11/06/2021 21:31:26 - INFO - __main__ - Step 1787: {'lr': 0.0004465, 'samples': 343104, 'steps': 1786, 'loss/train': 2.761946678161621} +11/06/2021 21:31:27 - INFO - __main__ - Step 1788: {'lr': 0.00044675, 'samples': 343296, 'steps': 1787, 'loss/train': 3.1174871921539307} +11/06/2021 21:31:27 - INFO - __main__ - Step 1789: {'lr': 0.000447, 'samples': 343488, 'steps': 1788, 'loss/train': 0.9450645446777344} +11/06/2021 21:31:27 - INFO - __main__ - Step 1790: {'lr': 0.00044725, 'samples': 343680, 'steps': 1789, 'loss/train': 2.685868263244629} +11/06/2021 21:31:28 - INFO - __main__ - Step 1791: {'lr': 0.00044750000000000004, 'samples': 343872, 'steps': 1790, 'loss/train': 3.149627685546875} +11/06/2021 21:31:29 - INFO - __main__ - Step 1792: {'lr': 0.00044775, 'samples': 344064, 'steps': 1791, 'loss/train': 2.8557493686676025} +11/06/2021 21:31:29 - INFO - __main__ - Step 1793: {'lr': 0.000448, 'samples': 344256, 'steps': 1792, 'loss/train': 2.3917579650878906} +11/06/2021 21:31:29 - INFO - __main__ - Step 1794: {'lr': 0.00044824999999999997, 'samples': 344448, 'steps': 1793, 'loss/train': 2.5539019107818604} +11/06/2021 21:31:30 - INFO - __main__ - Step 1795: {'lr': 0.0004485, 'samples': 344640, 'steps': 1794, 'loss/train': 2.866556167602539} +11/06/2021 21:31:31 - INFO - __main__ - Step 1796: {'lr': 0.00044875, 'samples': 344832, 'steps': 1795, 'loss/train': 2.69342303276062} +11/06/2021 21:31:31 - INFO - __main__ - Step 1797: {'lr': 0.000449, 'samples': 345024, 'steps': 1796, 'loss/train': 3.4725310802459717} +11/06/2021 21:31:32 - INFO - __main__ - Step 1798: {'lr': 0.00044925, 'samples': 345216, 'steps': 1797, 'loss/train': 3.1553845405578613} +11/06/2021 21:31:32 - INFO - __main__ - Step 1799: {'lr': 0.00044950000000000003, 'samples': 345408, 'steps': 1798, 'loss/train': 2.5512850284576416} +11/06/2021 21:31:32 - INFO - __main__ - Step 1800: {'lr': 0.00044975, 'samples': 345600, 'steps': 1799, 'loss/train': 2.6328558921813965} +11/06/2021 21:31:33 - INFO - __main__ - Step 1801: {'lr': 0.00045000000000000004, 'samples': 345792, 'steps': 1800, 'loss/train': 2.415855646133423} +11/06/2021 21:31:34 - INFO - __main__ - Step 1802: {'lr': 0.00045024999999999997, 'samples': 345984, 'steps': 1801, 'loss/train': 2.065478801727295} +11/06/2021 21:31:34 - INFO - __main__ - Step 1803: {'lr': 0.0004505, 'samples': 346176, 'steps': 1802, 'loss/train': 3.1000237464904785} +11/06/2021 21:31:34 - INFO - __main__ - Step 1804: {'lr': 0.00045075, 'samples': 346368, 'steps': 1803, 'loss/train': 3.079942464828491} +11/06/2021 21:31:35 - INFO - __main__ - Step 1805: {'lr': 0.000451, 'samples': 346560, 'steps': 1804, 'loss/train': 2.9212794303894043} +11/06/2021 21:31:36 - INFO - __main__ - Step 1806: {'lr': 0.00045125, 'samples': 346752, 'steps': 1805, 'loss/train': 2.327099323272705} +11/06/2021 21:31:36 - INFO - __main__ - Step 1807: {'lr': 0.0004515, 'samples': 346944, 'steps': 1806, 'loss/train': 2.2962563037872314} +11/06/2021 21:31:36 - INFO - __main__ - Step 1808: {'lr': 0.00045175, 'samples': 347136, 'steps': 1807, 'loss/train': 2.611140012741089} +11/06/2021 21:31:37 - INFO - __main__ - Step 1809: {'lr': 0.00045200000000000004, 'samples': 347328, 'steps': 1808, 'loss/train': 2.6826744079589844} +11/06/2021 21:31:37 - INFO - __main__ - Step 1810: {'lr': 0.00045225, 'samples': 347520, 'steps': 1809, 'loss/train': 1.936403512954712} +11/06/2021 21:31:38 - INFO - __main__ - Step 1811: {'lr': 0.00045250000000000005, 'samples': 347712, 'steps': 1810, 'loss/train': 2.373436450958252} +11/06/2021 21:31:39 - INFO - __main__ - Step 1812: {'lr': 0.00045275, 'samples': 347904, 'steps': 1811, 'loss/train': 2.730616807937622} +11/06/2021 21:31:39 - INFO - __main__ - Step 1813: {'lr': 0.000453, 'samples': 348096, 'steps': 1812, 'loss/train': 2.415011405944824} +11/06/2021 21:31:39 - INFO - __main__ - Step 1814: {'lr': 0.00045325, 'samples': 348288, 'steps': 1813, 'loss/train': 3.2586300373077393} +11/06/2021 21:31:40 - INFO - __main__ - Step 1815: {'lr': 0.0004535, 'samples': 348480, 'steps': 1814, 'loss/train': 2.568127155303955} +11/06/2021 21:31:40 - INFO - __main__ - Step 1816: {'lr': 0.00045375, 'samples': 348672, 'steps': 1815, 'loss/train': 2.9116480350494385} +11/06/2021 21:31:41 - INFO - __main__ - Step 1817: {'lr': 0.00045400000000000003, 'samples': 348864, 'steps': 1816, 'loss/train': 2.36753249168396} +11/06/2021 21:31:41 - INFO - __main__ - Step 1818: {'lr': 0.00045425, 'samples': 349056, 'steps': 1817, 'loss/train': 1.9278064966201782} +11/06/2021 21:31:42 - INFO - __main__ - Step 1819: {'lr': 0.00045450000000000004, 'samples': 349248, 'steps': 1818, 'loss/train': 3.1639034748077393} +11/06/2021 21:31:42 - INFO - __main__ - Step 1820: {'lr': 0.00045475, 'samples': 349440, 'steps': 1819, 'loss/train': 2.775869846343994} +11/06/2021 21:31:42 - INFO - __main__ - Step 1821: {'lr': 0.000455, 'samples': 349632, 'steps': 1820, 'loss/train': 1.739648699760437} +11/06/2021 21:31:44 - INFO - __main__ - Step 1822: {'lr': 0.00045525, 'samples': 349824, 'steps': 1821, 'loss/train': 2.914762258529663} +11/06/2021 21:31:44 - INFO - __main__ - Step 1823: {'lr': 0.0004555, 'samples': 350016, 'steps': 1822, 'loss/train': 2.881727457046509} +11/06/2021 21:31:44 - INFO - __main__ - Step 1824: {'lr': 0.00045575, 'samples': 350208, 'steps': 1823, 'loss/train': 2.6797189712524414} +11/06/2021 21:31:45 - INFO - __main__ - Step 1825: {'lr': 0.000456, 'samples': 350400, 'steps': 1824, 'loss/train': 3.1673336029052734} +11/06/2021 21:31:45 - INFO - __main__ - Step 1826: {'lr': 0.00045625, 'samples': 350592, 'steps': 1825, 'loss/train': 2.9814321994781494} +11/06/2021 21:31:45 - INFO - __main__ - Step 1827: {'lr': 0.00045650000000000004, 'samples': 350784, 'steps': 1826, 'loss/train': 2.706651210784912} +11/06/2021 21:31:47 - INFO - __main__ - Step 1828: {'lr': 0.00045675, 'samples': 350976, 'steps': 1827, 'loss/train': 2.262235403060913} +11/06/2021 21:31:47 - INFO - __main__ - Step 1829: {'lr': 0.00045700000000000005, 'samples': 351168, 'steps': 1828, 'loss/train': 3.5420644283294678} +11/06/2021 21:31:47 - INFO - __main__ - Step 1830: {'lr': 0.00045725, 'samples': 351360, 'steps': 1829, 'loss/train': 2.597929000854492} +11/06/2021 21:31:48 - INFO - __main__ - Step 1831: {'lr': 0.0004575, 'samples': 351552, 'steps': 1830, 'loss/train': 3.1444313526153564} +11/06/2021 21:31:48 - INFO - __main__ - Step 1832: {'lr': 0.00045775, 'samples': 351744, 'steps': 1831, 'loss/train': 2.755781650543213} +11/06/2021 21:31:49 - INFO - __main__ - Step 1833: {'lr': 0.000458, 'samples': 351936, 'steps': 1832, 'loss/train': 2.7278811931610107} +11/06/2021 21:31:50 - INFO - __main__ - Step 1834: {'lr': 0.00045825, 'samples': 352128, 'steps': 1833, 'loss/train': 3.7509689331054688} +11/06/2021 21:31:50 - INFO - __main__ - Step 1835: {'lr': 0.00045850000000000003, 'samples': 352320, 'steps': 1834, 'loss/train': 2.9152324199676514} +11/06/2021 21:31:50 - INFO - __main__ - Step 1836: {'lr': 0.00045875, 'samples': 352512, 'steps': 1835, 'loss/train': 3.254568338394165} +11/06/2021 21:31:51 - INFO - __main__ - Step 1837: {'lr': 0.00045900000000000004, 'samples': 352704, 'steps': 1836, 'loss/train': 3.5360164642333984} +11/06/2021 21:31:51 - INFO - __main__ - Step 1838: {'lr': 0.00045925, 'samples': 352896, 'steps': 1837, 'loss/train': 2.5410776138305664} +11/06/2021 21:31:52 - INFO - __main__ - Step 1839: {'lr': 0.00045950000000000006, 'samples': 353088, 'steps': 1838, 'loss/train': 3.515568971633911} +11/06/2021 21:31:52 - INFO - __main__ - Step 1840: {'lr': 0.00045975, 'samples': 353280, 'steps': 1839, 'loss/train': 2.9194540977478027} +11/06/2021 21:31:53 - INFO - __main__ - Step 1841: {'lr': 0.00046, 'samples': 353472, 'steps': 1840, 'loss/train': 3.339538335800171} +11/06/2021 21:31:53 - INFO - __main__ - Step 1842: {'lr': 0.00046025, 'samples': 353664, 'steps': 1841, 'loss/train': 3.2247955799102783} +11/06/2021 21:31:53 - INFO - __main__ - Step 1843: {'lr': 0.0004605, 'samples': 353856, 'steps': 1842, 'loss/train': 2.9142487049102783} +11/06/2021 21:31:54 - INFO - __main__ - Step 1844: {'lr': 0.00046075, 'samples': 354048, 'steps': 1843, 'loss/train': 3.003730058670044} +11/06/2021 21:31:55 - INFO - __main__ - Step 1845: {'lr': 0.00046100000000000004, 'samples': 354240, 'steps': 1844, 'loss/train': 2.9719865322113037} +11/06/2021 21:31:55 - INFO - __main__ - Step 1846: {'lr': 0.00046125, 'samples': 354432, 'steps': 1845, 'loss/train': 2.9568333625793457} +11/06/2021 21:31:55 - INFO - __main__ - Step 1847: {'lr': 0.00046150000000000005, 'samples': 354624, 'steps': 1846, 'loss/train': 3.0182647705078125} +11/06/2021 21:31:56 - INFO - __main__ - Step 1848: {'lr': 0.00046175000000000003, 'samples': 354816, 'steps': 1847, 'loss/train': 2.928616762161255} +11/06/2021 21:31:57 - INFO - __main__ - Step 1849: {'lr': 0.000462, 'samples': 355008, 'steps': 1848, 'loss/train': 2.610539674758911} +11/06/2021 21:31:57 - INFO - __main__ - Step 1850: {'lr': 0.00046225, 'samples': 355200, 'steps': 1849, 'loss/train': 2.6568455696105957} +11/06/2021 21:31:57 - INFO - __main__ - Step 1851: {'lr': 0.0004625, 'samples': 355392, 'steps': 1850, 'loss/train': 3.0052649974823} +11/06/2021 21:31:58 - INFO - __main__ - Step 1852: {'lr': 0.00046275, 'samples': 355584, 'steps': 1851, 'loss/train': 2.291944980621338} +11/06/2021 21:31:58 - INFO - __main__ - Step 1853: {'lr': 0.00046300000000000003, 'samples': 355776, 'steps': 1852, 'loss/train': 2.464561700820923} +11/06/2021 21:31:59 - INFO - __main__ - Step 1854: {'lr': 0.00046325, 'samples': 355968, 'steps': 1853, 'loss/train': 2.724757671356201} +11/06/2021 21:32:00 - INFO - __main__ - Step 1855: {'lr': 0.00046350000000000004, 'samples': 356160, 'steps': 1854, 'loss/train': 2.5522210597991943} +11/06/2021 21:32:00 - INFO - __main__ - Step 1856: {'lr': 0.00046375, 'samples': 356352, 'steps': 1855, 'loss/train': 2.9748101234436035} +11/06/2021 21:32:00 - INFO - __main__ - Step 1857: {'lr': 0.00046400000000000006, 'samples': 356544, 'steps': 1856, 'loss/train': 2.8747081756591797} +11/06/2021 21:32:01 - INFO - __main__ - Step 1858: {'lr': 0.00046425, 'samples': 356736, 'steps': 1857, 'loss/train': 3.183314085006714} +11/06/2021 21:32:01 - INFO - __main__ - Step 1859: {'lr': 0.0004645, 'samples': 356928, 'steps': 1858, 'loss/train': 2.9345762729644775} +11/06/2021 21:32:02 - INFO - __main__ - Step 1860: {'lr': 0.00046475, 'samples': 357120, 'steps': 1859, 'loss/train': 2.89750337600708} +11/06/2021 21:32:02 - INFO - __main__ - Step 1861: {'lr': 0.000465, 'samples': 357312, 'steps': 1860, 'loss/train': 2.8957128524780273} +11/06/2021 21:32:03 - INFO - __main__ - Step 1862: {'lr': 0.00046525, 'samples': 357504, 'steps': 1861, 'loss/train': 3.1396281719207764} +11/06/2021 21:32:03 - INFO - __main__ - Step 1863: {'lr': 0.00046550000000000004, 'samples': 357696, 'steps': 1862, 'loss/train': 2.8213651180267334} +11/06/2021 21:32:03 - INFO - __main__ - Step 1864: {'lr': 0.00046575, 'samples': 357888, 'steps': 1863, 'loss/train': 3.4859542846679688} +11/06/2021 21:32:04 - INFO - __main__ - Step 1865: {'lr': 0.00046600000000000005, 'samples': 358080, 'steps': 1864, 'loss/train': 2.8421342372894287} +11/06/2021 21:32:05 - INFO - __main__ - Step 1866: {'lr': 0.00046625000000000003, 'samples': 358272, 'steps': 1865, 'loss/train': 2.0108532905578613} +11/06/2021 21:32:05 - INFO - __main__ - Step 1867: {'lr': 0.0004665, 'samples': 358464, 'steps': 1866, 'loss/train': 3.0010299682617188} +11/06/2021 21:32:05 - INFO - __main__ - Step 1868: {'lr': 0.00046675, 'samples': 358656, 'steps': 1867, 'loss/train': 2.391618013381958} +11/06/2021 21:32:06 - INFO - __main__ - Step 1869: {'lr': 0.000467, 'samples': 358848, 'steps': 1868, 'loss/train': 1.2518956661224365} +11/06/2021 21:32:07 - INFO - __main__ - Step 1870: {'lr': 0.00046725, 'samples': 359040, 'steps': 1869, 'loss/train': 2.0170106887817383} +11/06/2021 21:32:07 - INFO - __main__ - Step 1871: {'lr': 0.00046750000000000003, 'samples': 359232, 'steps': 1870, 'loss/train': 1.179073691368103} +11/06/2021 21:32:08 - INFO - __main__ - Step 1872: {'lr': 0.00046775, 'samples': 359424, 'steps': 1871, 'loss/train': 2.682760715484619} +11/06/2021 21:32:08 - INFO - __main__ - Step 1873: {'lr': 0.00046800000000000005, 'samples': 359616, 'steps': 1872, 'loss/train': 2.571380138397217} +11/06/2021 21:32:08 - INFO - __main__ - Step 1874: {'lr': 0.00046825, 'samples': 359808, 'steps': 1873, 'loss/train': 3.113672971725464} +11/06/2021 21:32:10 - INFO - __main__ - Step 1875: {'lr': 0.00046850000000000006, 'samples': 360000, 'steps': 1874, 'loss/train': 3.40779447555542} +11/06/2021 21:32:10 - INFO - __main__ - Step 1876: {'lr': 0.00046875, 'samples': 360192, 'steps': 1875, 'loss/train': 2.6321020126342773} +11/06/2021 21:32:10 - INFO - __main__ - Step 1877: {'lr': 0.00046899999999999996, 'samples': 360384, 'steps': 1876, 'loss/train': 2.4527957439422607} +11/06/2021 21:32:11 - INFO - __main__ - Step 1878: {'lr': 0.00046925, 'samples': 360576, 'steps': 1877, 'loss/train': 2.8265886306762695} +11/06/2021 21:32:11 - INFO - __main__ - Step 1879: {'lr': 0.0004695, 'samples': 360768, 'steps': 1878, 'loss/train': 2.863210916519165} +11/06/2021 21:32:11 - INFO - __main__ - Step 1880: {'lr': 0.00046975, 'samples': 360960, 'steps': 1879, 'loss/train': 2.7804150581359863} +11/06/2021 21:32:12 - INFO - __main__ - Step 1881: {'lr': 0.00047, 'samples': 361152, 'steps': 1880, 'loss/train': 2.7934844493865967} +11/06/2021 21:32:13 - INFO - __main__ - Step 1882: {'lr': 0.00047025, 'samples': 361344, 'steps': 1881, 'loss/train': 2.5030977725982666} +11/06/2021 21:32:13 - INFO - __main__ - Step 1883: {'lr': 0.0004705, 'samples': 361536, 'steps': 1882, 'loss/train': 2.1091949939727783} +11/06/2021 21:32:13 - INFO - __main__ - Step 1884: {'lr': 0.00047075000000000003, 'samples': 361728, 'steps': 1883, 'loss/train': 2.5549018383026123} +11/06/2021 21:32:14 - INFO - __main__ - Step 1885: {'lr': 0.000471, 'samples': 361920, 'steps': 1884, 'loss/train': 2.7697577476501465} +11/06/2021 21:32:15 - INFO - __main__ - Step 1886: {'lr': 0.00047125, 'samples': 362112, 'steps': 1885, 'loss/train': 2.8604817390441895} +11/06/2021 21:32:15 - INFO - __main__ - Step 1887: {'lr': 0.00047149999999999997, 'samples': 362304, 'steps': 1886, 'loss/train': 2.9714930057525635} +11/06/2021 21:32:16 - INFO - __main__ - Step 1888: {'lr': 0.00047175, 'samples': 362496, 'steps': 1887, 'loss/train': 3.0450122356414795} +11/06/2021 21:32:16 - INFO - __main__ - Step 1889: {'lr': 0.000472, 'samples': 362688, 'steps': 1888, 'loss/train': 2.69807505607605} +11/06/2021 21:32:16 - INFO - __main__ - Step 1890: {'lr': 0.00047225, 'samples': 362880, 'steps': 1889, 'loss/train': 2.992997884750366} +11/06/2021 21:32:17 - INFO - __main__ - Step 1891: {'lr': 0.0004725, 'samples': 363072, 'steps': 1890, 'loss/train': 2.015784740447998} +11/06/2021 21:32:18 - INFO - __main__ - Step 1892: {'lr': 0.00047275, 'samples': 363264, 'steps': 1891, 'loss/train': 2.8816325664520264} +11/06/2021 21:32:18 - INFO - __main__ - Step 1893: {'lr': 0.000473, 'samples': 363456, 'steps': 1892, 'loss/train': 3.2066597938537598} +11/06/2021 21:32:18 - INFO - __main__ - Step 1894: {'lr': 0.00047325000000000004, 'samples': 363648, 'steps': 1893, 'loss/train': 2.5090718269348145} +11/06/2021 21:32:19 - INFO - __main__ - Step 1895: {'lr': 0.00047349999999999996, 'samples': 363840, 'steps': 1894, 'loss/train': 2.715529680252075} +11/06/2021 21:32:19 - INFO - __main__ - Step 1896: {'lr': 0.00047375, 'samples': 364032, 'steps': 1895, 'loss/train': 2.8144490718841553} +11/06/2021 21:32:20 - INFO - __main__ - Step 1897: {'lr': 0.000474, 'samples': 364224, 'steps': 1896, 'loss/train': 2.670848846435547} +11/06/2021 21:32:21 - INFO - __main__ - Step 1898: {'lr': 0.00047425, 'samples': 364416, 'steps': 1897, 'loss/train': 2.614722728729248} +11/06/2021 21:32:21 - INFO - __main__ - Step 1899: {'lr': 0.0004745, 'samples': 364608, 'steps': 1898, 'loss/train': 2.741778612136841} +11/06/2021 21:32:21 - INFO - __main__ - Step 1900: {'lr': 0.00047475, 'samples': 364800, 'steps': 1899, 'loss/train': 3.1232104301452637} +11/06/2021 21:32:22 - INFO - __main__ - Step 1901: {'lr': 0.000475, 'samples': 364992, 'steps': 1900, 'loss/train': 2.564000368118286} +11/06/2021 21:32:23 - INFO - __main__ - Step 1902: {'lr': 0.00047525000000000003, 'samples': 365184, 'steps': 1901, 'loss/train': 2.7664237022399902} +11/06/2021 21:32:23 - INFO - __main__ - Step 1903: {'lr': 0.0004755, 'samples': 365376, 'steps': 1902, 'loss/train': 2.554410934448242} +11/06/2021 21:32:23 - INFO - __main__ - Step 1904: {'lr': 0.00047575, 'samples': 365568, 'steps': 1903, 'loss/train': 2.5446524620056152} +11/06/2021 21:32:24 - INFO - __main__ - Step 1905: {'lr': 0.00047599999999999997, 'samples': 365760, 'steps': 1904, 'loss/train': 2.754312515258789} +11/06/2021 21:32:24 - INFO - __main__ - Step 1906: {'lr': 0.00047625, 'samples': 365952, 'steps': 1905, 'loss/train': 2.7138187885284424} +11/06/2021 21:32:25 - INFO - __main__ - Step 1907: {'lr': 0.0004765, 'samples': 366144, 'steps': 1906, 'loss/train': 2.9011712074279785} +11/06/2021 21:32:25 - INFO - __main__ - Step 1908: {'lr': 0.00047675, 'samples': 366336, 'steps': 1907, 'loss/train': 2.7939672470092773} +11/06/2021 21:32:26 - INFO - __main__ - Step 1909: {'lr': 0.000477, 'samples': 366528, 'steps': 1908, 'loss/train': 3.0879056453704834} +11/06/2021 21:32:26 - INFO - __main__ - Step 1910: {'lr': 0.00047725, 'samples': 366720, 'steps': 1909, 'loss/train': 2.4980082511901855} +11/06/2021 21:32:26 - INFO - __main__ - Step 1911: {'lr': 0.0004775, 'samples': 366912, 'steps': 1910, 'loss/train': 2.949843645095825} +11/06/2021 21:32:27 - INFO - __main__ - Step 1912: {'lr': 0.00047775000000000004, 'samples': 367104, 'steps': 1911, 'loss/train': 2.661370277404785} +11/06/2021 21:32:28 - INFO - __main__ - Step 1913: {'lr': 0.00047799999999999996, 'samples': 367296, 'steps': 1912, 'loss/train': 2.855457305908203} +11/06/2021 21:32:28 - INFO - __main__ - Step 1914: {'lr': 0.00047825, 'samples': 367488, 'steps': 1913, 'loss/train': 2.790748119354248} +11/06/2021 21:32:28 - INFO - __main__ - Step 1915: {'lr': 0.0004785, 'samples': 367680, 'steps': 1914, 'loss/train': 2.1920478343963623} +11/06/2021 21:32:29 - INFO - __main__ - Step 1916: {'lr': 0.00047875, 'samples': 367872, 'steps': 1915, 'loss/train': 3.010140895843506} +11/06/2021 21:32:30 - INFO - __main__ - Step 1917: {'lr': 0.000479, 'samples': 368064, 'steps': 1916, 'loss/train': 2.7934629917144775} +11/06/2021 21:32:30 - INFO - __main__ - Step 1918: {'lr': 0.00047925, 'samples': 368256, 'steps': 1917, 'loss/train': 2.759575128555298} +11/06/2021 21:32:31 - INFO - __main__ - Step 1919: {'lr': 0.0004795, 'samples': 368448, 'steps': 1918, 'loss/train': 2.1986517906188965} +11/06/2021 21:32:31 - INFO - __main__ - Step 1920: {'lr': 0.00047975000000000003, 'samples': 368640, 'steps': 1919, 'loss/train': 2.7708301544189453} +11/06/2021 21:32:31 - INFO - __main__ - Step 1921: {'lr': 0.00048, 'samples': 368832, 'steps': 1920, 'loss/train': 4.627929210662842} +11/06/2021 21:32:32 - INFO - __main__ - Step 1922: {'lr': 0.00048025000000000005, 'samples': 369024, 'steps': 1921, 'loss/train': 2.932852029800415} +11/06/2021 21:32:33 - INFO - __main__ - Step 1923: {'lr': 0.00048049999999999997, 'samples': 369216, 'steps': 1922, 'loss/train': 2.970147132873535} +11/06/2021 21:32:33 - INFO - __main__ - Step 1924: {'lr': 0.00048075, 'samples': 369408, 'steps': 1923, 'loss/train': 3.2570888996124268} +11/06/2021 21:32:33 - INFO - __main__ - Step 1925: {'lr': 0.000481, 'samples': 369600, 'steps': 1924, 'loss/train': 2.7547266483306885} +11/06/2021 21:32:34 - INFO - __main__ - Step 1926: {'lr': 0.00048125, 'samples': 369792, 'steps': 1925, 'loss/train': 2.5552988052368164} +11/06/2021 21:32:34 - INFO - __main__ - Step 1927: {'lr': 0.0004815, 'samples': 369984, 'steps': 1926, 'loss/train': 2.8720643520355225} +11/06/2021 21:32:35 - INFO - __main__ - Step 1928: {'lr': 0.00048175000000000003, 'samples': 370176, 'steps': 1927, 'loss/train': 3.4235241413116455} +11/06/2021 21:32:35 - INFO - __main__ - Step 1929: {'lr': 0.000482, 'samples': 370368, 'steps': 1928, 'loss/train': 2.794508457183838} +11/06/2021 21:32:36 - INFO - __main__ - Step 1930: {'lr': 0.00048225000000000004, 'samples': 370560, 'steps': 1929, 'loss/train': 3.3702750205993652} +11/06/2021 21:32:36 - INFO - __main__ - Step 1931: {'lr': 0.0004825, 'samples': 370752, 'steps': 1930, 'loss/train': 3.3786303997039795} +11/06/2021 21:32:36 - INFO - __main__ - Step 1932: {'lr': 0.00048275, 'samples': 370944, 'steps': 1931, 'loss/train': 2.7347774505615234} +11/06/2021 21:32:37 - INFO - __main__ - Step 1933: {'lr': 0.000483, 'samples': 371136, 'steps': 1932, 'loss/train': 2.8218722343444824} +11/06/2021 21:32:38 - INFO - __main__ - Step 1934: {'lr': 0.00048325, 'samples': 371328, 'steps': 1933, 'loss/train': 1.854628324508667} +11/06/2021 21:32:38 - INFO - __main__ - Step 1935: {'lr': 0.0004835, 'samples': 371520, 'steps': 1934, 'loss/train': 2.730201244354248} +11/06/2021 21:32:38 - INFO - __main__ - Step 1936: {'lr': 0.00048375, 'samples': 371712, 'steps': 1935, 'loss/train': 2.558645725250244} +11/06/2021 21:32:39 - INFO - __main__ - Step 1937: {'lr': 0.000484, 'samples': 371904, 'steps': 1936, 'loss/train': 2.328354597091675} +11/06/2021 21:32:40 - INFO - __main__ - Step 1938: {'lr': 0.00048425000000000003, 'samples': 372096, 'steps': 1937, 'loss/train': 2.217445135116577} +11/06/2021 21:32:40 - INFO - __main__ - Step 1939: {'lr': 0.0004845, 'samples': 372288, 'steps': 1938, 'loss/train': 2.765631675720215} +11/06/2021 21:32:41 - INFO - __main__ - Step 1940: {'lr': 0.00048475000000000005, 'samples': 372480, 'steps': 1939, 'loss/train': 2.3212947845458984} +11/06/2021 21:32:41 - INFO - __main__ - Step 1941: {'lr': 0.00048499999999999997, 'samples': 372672, 'steps': 1940, 'loss/train': 2.563457727432251} +11/06/2021 21:32:41 - INFO - __main__ - Step 1942: {'lr': 0.00048525, 'samples': 372864, 'steps': 1941, 'loss/train': 2.725562334060669} +11/06/2021 21:32:42 - INFO - __main__ - Step 1943: {'lr': 0.0004855, 'samples': 373056, 'steps': 1942, 'loss/train': 2.3403518199920654} +11/06/2021 21:32:43 - INFO - __main__ - Step 1944: {'lr': 0.00048575, 'samples': 373248, 'steps': 1943, 'loss/train': 2.5952484607696533} +11/06/2021 21:32:43 - INFO - __main__ - Step 1945: {'lr': 0.000486, 'samples': 373440, 'steps': 1944, 'loss/train': 3.019125461578369} +11/06/2021 21:32:43 - INFO - __main__ - Step 1946: {'lr': 0.00048625000000000003, 'samples': 373632, 'steps': 1945, 'loss/train': 2.831516981124878} +11/06/2021 21:32:44 - INFO - __main__ - Step 1947: {'lr': 0.0004865, 'samples': 373824, 'steps': 1946, 'loss/train': 2.3622794151306152} +11/06/2021 21:32:45 - INFO - __main__ - Step 1948: {'lr': 0.00048675000000000004, 'samples': 374016, 'steps': 1947, 'loss/train': 2.709298849105835} +11/06/2021 21:32:45 - INFO - __main__ - Step 1949: {'lr': 0.000487, 'samples': 374208, 'steps': 1948, 'loss/train': 2.702164888381958} +11/06/2021 21:32:45 - INFO - __main__ - Step 1950: {'lr': 0.00048725000000000005, 'samples': 374400, 'steps': 1949, 'loss/train': 2.7699882984161377} +11/06/2021 21:32:46 - INFO - __main__ - Step 1951: {'lr': 0.0004875, 'samples': 374592, 'steps': 1950, 'loss/train': 3.081878900527954} +11/06/2021 21:32:46 - INFO - __main__ - Step 1952: {'lr': 0.00048775, 'samples': 374784, 'steps': 1951, 'loss/train': 2.322448492050171} +11/06/2021 21:32:47 - INFO - __main__ - Step 1953: {'lr': 0.000488, 'samples': 374976, 'steps': 1952, 'loss/train': 3.033129930496216} +11/06/2021 21:32:48 - INFO - __main__ - Step 1954: {'lr': 0.00048825, 'samples': 375168, 'steps': 1953, 'loss/train': 3.0832743644714355} +11/06/2021 21:32:48 - INFO - __main__ - Step 1955: {'lr': 0.0004885, 'samples': 375360, 'steps': 1954, 'loss/train': 2.644732713699341} +11/06/2021 21:32:48 - INFO - __main__ - Step 1956: {'lr': 0.00048875, 'samples': 375552, 'steps': 1955, 'loss/train': 2.585529327392578} +11/06/2021 21:32:49 - INFO - __main__ - Step 1957: {'lr': 0.000489, 'samples': 375744, 'steps': 1956, 'loss/train': 2.618997812271118} +11/06/2021 21:32:49 - INFO - __main__ - Step 1958: {'lr': 0.00048925, 'samples': 375936, 'steps': 1957, 'loss/train': 2.3187615871429443} +11/06/2021 21:32:50 - INFO - __main__ - Step 1959: {'lr': 0.0004895, 'samples': 376128, 'steps': 1958, 'loss/train': 0.9907362461090088} +11/06/2021 21:32:50 - INFO - __main__ - Step 1960: {'lr': 0.0004897500000000001, 'samples': 376320, 'steps': 1959, 'loss/train': 2.583451986312866} +11/06/2021 21:32:51 - INFO - __main__ - Step 1961: {'lr': 0.00049, 'samples': 376512, 'steps': 1960, 'loss/train': 2.766582489013672} +11/06/2021 21:32:51 - INFO - __main__ - Step 1962: {'lr': 0.00049025, 'samples': 376704, 'steps': 1961, 'loss/train': 2.8893637657165527} +11/06/2021 21:32:51 - INFO - __main__ - Step 1963: {'lr': 0.0004905, 'samples': 376896, 'steps': 1962, 'loss/train': 2.1860101222991943} +11/06/2021 21:32:53 - INFO - __main__ - Step 1964: {'lr': 0.0004907500000000001, 'samples': 377088, 'steps': 1963, 'loss/train': 2.513594150543213} +11/06/2021 21:32:53 - INFO - __main__ - Step 1965: {'lr': 0.000491, 'samples': 377280, 'steps': 1964, 'loss/train': 1.6197631359100342} +11/06/2021 21:32:53 - INFO - __main__ - Step 1966: {'lr': 0.00049125, 'samples': 377472, 'steps': 1965, 'loss/train': 2.5828354358673096} +11/06/2021 21:32:54 - INFO - __main__ - Step 1967: {'lr': 0.0004915, 'samples': 377664, 'steps': 1966, 'loss/train': 3.0170748233795166} +11/06/2021 21:32:54 - INFO - __main__ - Step 1968: {'lr': 0.00049175, 'samples': 377856, 'steps': 1967, 'loss/train': 1.9359134435653687} +11/06/2021 21:32:55 - INFO - __main__ - Step 1969: {'lr': 0.000492, 'samples': 378048, 'steps': 1968, 'loss/train': 2.57096266746521} +11/06/2021 21:32:55 - INFO - __main__ - Step 1970: {'lr': 0.0004922500000000001, 'samples': 378240, 'steps': 1969, 'loss/train': 2.656981945037842} +11/06/2021 21:32:56 - INFO - __main__ - Step 1971: {'lr': 0.0004925, 'samples': 378432, 'steps': 1970, 'loss/train': 2.5854079723358154} +11/06/2021 21:32:56 - INFO - __main__ - Step 1972: {'lr': 0.00049275, 'samples': 378624, 'steps': 1971, 'loss/train': 2.834716796875} +11/06/2021 21:32:56 - INFO - __main__ - Step 1973: {'lr': 0.0004930000000000001, 'samples': 378816, 'steps': 1972, 'loss/train': 2.5970420837402344} +11/06/2021 21:32:57 - INFO - __main__ - Step 1974: {'lr': 0.00049325, 'samples': 379008, 'steps': 1973, 'loss/train': 2.524550676345825} +11/06/2021 21:32:58 - INFO - __main__ - Step 1975: {'lr': 0.0004935, 'samples': 379200, 'steps': 1974, 'loss/train': 2.7941884994506836} +11/06/2021 21:32:58 - INFO - __main__ - Step 1976: {'lr': 0.00049375, 'samples': 379392, 'steps': 1975, 'loss/train': 2.233511447906494} +11/06/2021 21:32:58 - INFO - __main__ - Step 1977: {'lr': 0.000494, 'samples': 379584, 'steps': 1976, 'loss/train': 2.7673490047454834} +11/06/2021 21:32:59 - INFO - __main__ - Step 1978: {'lr': 0.00049425, 'samples': 379776, 'steps': 1977, 'loss/train': 2.7276995182037354} +11/06/2021 21:32:59 - INFO - __main__ - Step 1979: {'lr': 0.0004945, 'samples': 379968, 'steps': 1978, 'loss/train': 3.163912534713745} +11/06/2021 21:33:00 - INFO - __main__ - Step 1980: {'lr': 0.0004947500000000001, 'samples': 380160, 'steps': 1979, 'loss/train': 2.734490394592285} +11/06/2021 21:33:00 - INFO - __main__ - Step 1981: {'lr': 0.000495, 'samples': 380352, 'steps': 1980, 'loss/train': 2.695145845413208} +11/06/2021 21:33:01 - INFO - __main__ - Step 1982: {'lr': 0.00049525, 'samples': 380544, 'steps': 1981, 'loss/train': 2.7770211696624756} +11/06/2021 21:33:01 - INFO - __main__ - Step 1983: {'lr': 0.0004955, 'samples': 380736, 'steps': 1982, 'loss/train': 2.7686867713928223} +11/06/2021 21:33:02 - INFO - __main__ - Step 1984: {'lr': 0.00049575, 'samples': 380928, 'steps': 1983, 'loss/train': 2.8708817958831787} +11/06/2021 21:33:03 - INFO - __main__ - Step 1985: {'lr': 0.000496, 'samples': 381120, 'steps': 1984, 'loss/train': 2.6449930667877197} +11/06/2021 21:33:03 - INFO - __main__ - Step 1986: {'lr': 0.0004962500000000001, 'samples': 381312, 'steps': 1985, 'loss/train': 2.249175786972046} +11/06/2021 21:33:03 - INFO - __main__ - Step 1987: {'lr': 0.0004965, 'samples': 381504, 'steps': 1986, 'loss/train': 2.399980068206787} +11/06/2021 21:33:04 - INFO - __main__ - Step 1988: {'lr': 0.00049675, 'samples': 381696, 'steps': 1987, 'loss/train': 2.932748556137085} +11/06/2021 21:33:04 - INFO - __main__ - Step 1989: {'lr': 0.000497, 'samples': 381888, 'steps': 1988, 'loss/train': 2.3569090366363525} +11/06/2021 21:33:05 - INFO - __main__ - Step 1990: {'lr': 0.0004972500000000001, 'samples': 382080, 'steps': 1989, 'loss/train': 2.4476397037506104} +11/06/2021 21:33:05 - INFO - __main__ - Step 1991: {'lr': 0.0004975, 'samples': 382272, 'steps': 1990, 'loss/train': 3.7033238410949707} +11/06/2021 21:33:06 - INFO - __main__ - Step 1992: {'lr': 0.00049775, 'samples': 382464, 'steps': 1991, 'loss/train': 2.872666835784912} +11/06/2021 21:33:06 - INFO - __main__ - Step 1993: {'lr': 0.000498, 'samples': 382656, 'steps': 1992, 'loss/train': 2.463730573654175} +11/06/2021 21:33:06 - INFO - __main__ - Step 1994: {'lr': 0.00049825, 'samples': 382848, 'steps': 1993, 'loss/train': 2.2862772941589355} +11/06/2021 21:33:07 - INFO - __main__ - Step 1995: {'lr': 0.0004985, 'samples': 383040, 'steps': 1994, 'loss/train': 2.9158213138580322} +11/06/2021 21:33:08 - INFO - __main__ - Step 1996: {'lr': 0.0004987500000000001, 'samples': 383232, 'steps': 1995, 'loss/train': 2.440356731414795} +11/06/2021 21:33:08 - INFO - __main__ - Step 1997: {'lr': 0.000499, 'samples': 383424, 'steps': 1996, 'loss/train': 2.8165547847747803} +11/06/2021 21:33:08 - INFO - __main__ - Step 1998: {'lr': 0.00049925, 'samples': 383616, 'steps': 1997, 'loss/train': 2.460160970687866} +11/06/2021 21:33:09 - INFO - __main__ - Step 1999: {'lr': 0.0004995, 'samples': 383808, 'steps': 1998, 'loss/train': 2.8963072299957275} +11/06/2021 21:33:10 - INFO - __main__ - Step 2000: {'lr': 0.0004997500000000001, 'samples': 384000, 'steps': 1999, 'loss/train': 2.667146921157837} +11/06/2021 21:33:10 - INFO - __main__ - Step 2001: {'lr': 0.0005, 'samples': 384192, 'steps': 2000, 'loss/train': 1.9915542602539062} +11/06/2021 21:33:10 - INFO - __main__ - Step 2002: {'lr': 0.0004999999999436769, 'samples': 384384, 'steps': 2001, 'loss/train': 2.369316816329956} +11/06/2021 21:33:11 - INFO - __main__ - Step 2003: {'lr': 0.0004999999997747077, 'samples': 384576, 'steps': 2002, 'loss/train': 2.117219924926758} +11/06/2021 21:33:11 - INFO - __main__ - Step 2004: {'lr': 0.0004999999994930923, 'samples': 384768, 'steps': 2003, 'loss/train': 3.217236280441284} +11/06/2021 21:33:12 - INFO - __main__ - Step 2005: {'lr': 0.0004999999990988309, 'samples': 384960, 'steps': 2004, 'loss/train': 2.4494330883026123} +11/06/2021 21:33:13 - INFO - __main__ - Step 2006: {'lr': 0.0004999999985919232, 'samples': 385152, 'steps': 2005, 'loss/train': 2.7397634983062744} +11/06/2021 21:33:13 - INFO - __main__ - Step 2007: {'lr': 0.0004999999979723695, 'samples': 385344, 'steps': 2006, 'loss/train': 1.72874915599823} +11/06/2021 21:33:13 - INFO - __main__ - Step 2008: {'lr': 0.0004999999972401696, 'samples': 385536, 'steps': 2007, 'loss/train': 2.854842185974121} +11/06/2021 21:33:14 - INFO - __main__ - Step 2009: {'lr': 0.0004999999963953234, 'samples': 385728, 'steps': 2008, 'loss/train': 2.8656506538391113} +11/06/2021 21:33:14 - INFO - __main__ - Step 2010: {'lr': 0.0004999999954378312, 'samples': 385920, 'steps': 2009, 'loss/train': 2.108156681060791} +11/06/2021 21:33:15 - INFO - __main__ - Step 2011: {'lr': 0.000499999994367693, 'samples': 386112, 'steps': 2010, 'loss/train': 2.626335382461548} +11/06/2021 21:33:15 - INFO - __main__ - Step 2012: {'lr': 0.0004999999931849084, 'samples': 386304, 'steps': 2011, 'loss/train': 2.684321403503418} +11/06/2021 21:33:16 - INFO - __main__ - Step 2013: {'lr': 0.0004999999918894778, 'samples': 386496, 'steps': 2012, 'loss/train': 2.6967201232910156} +11/06/2021 21:33:16 - INFO - __main__ - Step 2014: {'lr': 0.000499999990481401, 'samples': 386688, 'steps': 2013, 'loss/train': 2.6608567237854004} +11/06/2021 21:33:16 - INFO - __main__ - Step 2015: {'lr': 0.0004999999889606781, 'samples': 386880, 'steps': 2014, 'loss/train': 2.773587942123413} +11/06/2021 21:33:17 - INFO - __main__ - Step 2016: {'lr': 0.0004999999873273091, 'samples': 387072, 'steps': 2015, 'loss/train': 2.5396175384521484} +11/06/2021 21:33:18 - INFO - __main__ - Step 2017: {'lr': 0.000499999985581294, 'samples': 387264, 'steps': 2016, 'loss/train': 2.9286653995513916} +11/06/2021 21:33:18 - INFO - __main__ - Step 2018: {'lr': 0.0004999999837226326, 'samples': 387456, 'steps': 2017, 'loss/train': 2.4174294471740723} +11/06/2021 21:33:18 - INFO - __main__ - Step 2019: {'lr': 0.0004999999817513252, 'samples': 387648, 'steps': 2018, 'loss/train': 2.4650332927703857} +11/06/2021 21:33:19 - INFO - __main__ - Step 2020: {'lr': 0.0004999999796673716, 'samples': 387840, 'steps': 2019, 'loss/train': 2.799029588699341} +11/06/2021 21:33:20 - INFO - __main__ - Step 2021: {'lr': 0.0004999999774707719, 'samples': 388032, 'steps': 2020, 'loss/train': 2.8545684814453125} +11/06/2021 21:33:20 - INFO - __main__ - Step 2022: {'lr': 0.0004999999751615261, 'samples': 388224, 'steps': 2021, 'loss/train': 2.4763200283050537} +11/06/2021 21:33:20 - INFO - __main__ - Step 2023: {'lr': 0.0004999999727396341, 'samples': 388416, 'steps': 2022, 'loss/train': 2.094083309173584} +11/06/2021 21:33:21 - INFO - __main__ - Step 2024: {'lr': 0.0004999999702050959, 'samples': 388608, 'steps': 2023, 'loss/train': 2.4490573406219482} +11/06/2021 21:33:21 - INFO - __main__ - Step 2025: {'lr': 0.0004999999675579118, 'samples': 388800, 'steps': 2024, 'loss/train': 3.2666213512420654} +11/06/2021 21:33:22 - INFO - __main__ - Step 2026: {'lr': 0.0004999999647980814, 'samples': 388992, 'steps': 2025, 'loss/train': 2.2224512100219727} +11/06/2021 21:33:23 - INFO - __main__ - Step 2027: {'lr': 0.0004999999619256049, 'samples': 389184, 'steps': 2026, 'loss/train': 3.0559303760528564} +11/06/2021 21:33:23 - INFO - __main__ - Step 2028: {'lr': 0.0004999999589404822, 'samples': 389376, 'steps': 2027, 'loss/train': 2.4753761291503906} +11/06/2021 21:33:23 - INFO - __main__ - Step 2029: {'lr': 0.0004999999558427136, 'samples': 389568, 'steps': 2028, 'loss/train': 2.350665807723999} +11/06/2021 21:33:24 - INFO - __main__ - Step 2030: {'lr': 0.0004999999526322987, 'samples': 389760, 'steps': 2029, 'loss/train': 2.9428741931915283} +11/06/2021 21:33:24 - INFO - __main__ - Step 2031: {'lr': 0.0004999999493092377, 'samples': 389952, 'steps': 2030, 'loss/train': 2.561460018157959} +11/06/2021 21:33:25 - INFO - __main__ - Step 2032: {'lr': 0.0004999999458735306, 'samples': 390144, 'steps': 2031, 'loss/train': 2.2386529445648193} +11/06/2021 21:33:26 - INFO - __main__ - Step 2033: {'lr': 0.0004999999423251774, 'samples': 390336, 'steps': 2032, 'loss/train': 2.3020198345184326} +11/06/2021 21:33:26 - INFO - __main__ - Step 2034: {'lr': 0.0004999999386641781, 'samples': 390528, 'steps': 2033, 'loss/train': 2.7840397357940674} +11/06/2021 21:33:26 - INFO - __main__ - Step 2035: {'lr': 0.0004999999348905326, 'samples': 390720, 'steps': 2034, 'loss/train': 2.2460341453552246} +11/06/2021 21:33:27 - INFO - __main__ - Step 2036: {'lr': 0.000499999931004241, 'samples': 390912, 'steps': 2035, 'loss/train': 2.3942503929138184} +11/06/2021 21:33:28 - INFO - __main__ - Step 2037: {'lr': 0.0004999999270053034, 'samples': 391104, 'steps': 2036, 'loss/train': 3.297150135040283} +11/06/2021 21:33:28 - INFO - __main__ - Step 2038: {'lr': 0.0004999999228937196, 'samples': 391296, 'steps': 2037, 'loss/train': 2.8241195678710938} +11/06/2021 21:33:28 - INFO - __main__ - Step 2039: {'lr': 0.0004999999186694897, 'samples': 391488, 'steps': 2038, 'loss/train': 2.7766733169555664} +11/06/2021 21:33:29 - INFO - __main__ - Step 2040: {'lr': 0.0004999999143326137, 'samples': 391680, 'steps': 2039, 'loss/train': 2.7513749599456787} +11/06/2021 21:33:29 - INFO - __main__ - Step 2041: {'lr': 0.0004999999098830916, 'samples': 391872, 'steps': 2040, 'loss/train': 2.4639899730682373} +11/06/2021 21:33:30 - INFO - __main__ - Step 2042: {'lr': 0.0004999999053209235, 'samples': 392064, 'steps': 2041, 'loss/train': 2.83908748626709} +11/06/2021 21:33:30 - INFO - __main__ - Step 2043: {'lr': 0.0004999999006461091, 'samples': 392256, 'steps': 2042, 'loss/train': 2.7250239849090576} +11/06/2021 21:33:31 - INFO - __main__ - Step 2044: {'lr': 0.0004999998958586487, 'samples': 392448, 'steps': 2043, 'loss/train': 2.2710461616516113} +11/06/2021 21:33:31 - INFO - __main__ - Step 2045: {'lr': 0.0004999998909585423, 'samples': 392640, 'steps': 2044, 'loss/train': 2.9703567028045654} +11/06/2021 21:33:31 - INFO - __main__ - Step 2046: {'lr': 0.0004999998859457896, 'samples': 392832, 'steps': 2045, 'loss/train': 1.9827837944030762} +11/06/2021 21:33:33 - INFO - __main__ - Step 2047: {'lr': 0.0004999998808203909, 'samples': 393024, 'steps': 2046, 'loss/train': 2.4545347690582275} +11/06/2021 21:33:33 - INFO - __main__ - Step 2048: {'lr': 0.0004999998755823462, 'samples': 393216, 'steps': 2047, 'loss/train': 2.7062439918518066} +11/06/2021 21:33:33 - INFO - __main__ - Step 2049: {'lr': 0.0004999998702316553, 'samples': 393408, 'steps': 2048, 'loss/train': 2.6722590923309326} +11/06/2021 21:33:34 - INFO - __main__ - Step 2050: {'lr': 0.0004999998647683184, 'samples': 393600, 'steps': 2049, 'loss/train': 2.4513065814971924} +11/06/2021 21:33:34 - INFO - __main__ - Step 2051: {'lr': 0.0004999998591923353, 'samples': 393792, 'steps': 2050, 'loss/train': 2.691094398498535} +11/06/2021 21:33:34 - INFO - __main__ - Step 2052: {'lr': 0.0004999998535037063, 'samples': 393984, 'steps': 2051, 'loss/train': 2.209742307662964} +11/06/2021 21:33:35 - INFO - __main__ - Step 2053: {'lr': 0.0004999998477024311, 'samples': 394176, 'steps': 2052, 'loss/train': 2.50882887840271} +11/06/2021 21:33:36 - INFO - __main__ - Step 2054: {'lr': 0.0004999998417885099, 'samples': 394368, 'steps': 2053, 'loss/train': 2.435020685195923} +11/06/2021 21:33:36 - INFO - __main__ - Step 2055: {'lr': 0.0004999998357619425, 'samples': 394560, 'steps': 2054, 'loss/train': 2.0775961875915527} +11/06/2021 21:33:36 - INFO - __main__ - Step 2056: {'lr': 0.0004999998296227291, 'samples': 394752, 'steps': 2055, 'loss/train': 2.863607168197632} +11/06/2021 21:33:37 - INFO - __main__ - Step 2057: {'lr': 0.0004999998233708697, 'samples': 394944, 'steps': 2056, 'loss/train': 2.371857166290283} +11/06/2021 21:33:38 - INFO - __main__ - Step 2058: {'lr': 0.0004999998170063642, 'samples': 395136, 'steps': 2057, 'loss/train': 2.9623489379882812} +11/06/2021 21:33:38 - INFO - __main__ - Step 2059: {'lr': 0.0004999998105292126, 'samples': 395328, 'steps': 2058, 'loss/train': 2.637700319290161} +11/06/2021 21:33:39 - INFO - __main__ - Step 2060: {'lr': 0.000499999803939415, 'samples': 395520, 'steps': 2059, 'loss/train': 2.8465237617492676} +11/06/2021 21:33:39 - INFO - __main__ - Step 2061: {'lr': 0.0004999997972369713, 'samples': 395712, 'steps': 2060, 'loss/train': 2.0144639015197754} +11/06/2021 21:33:39 - INFO - __main__ - Step 2062: {'lr': 0.0004999997904218816, 'samples': 395904, 'steps': 2061, 'loss/train': 2.385756254196167} +11/06/2021 21:33:40 - INFO - __main__ - Step 2063: {'lr': 0.0004999997834941459, 'samples': 396096, 'steps': 2062, 'loss/train': 3.102501153945923} +11/06/2021 21:33:41 - INFO - __main__ - Step 2064: {'lr': 0.000499999776453764, 'samples': 396288, 'steps': 2063, 'loss/train': 1.95815908908844} +11/06/2021 21:33:41 - INFO - __main__ - Step 2065: {'lr': 0.0004999997693007361, 'samples': 396480, 'steps': 2064, 'loss/train': 2.9032347202301025} +11/06/2021 21:33:41 - INFO - __main__ - Step 2066: {'lr': 0.0004999997620350622, 'samples': 396672, 'steps': 2065, 'loss/train': 2.321173906326294} +11/06/2021 21:33:42 - INFO - __main__ - Step 2067: {'lr': 0.0004999997546567423, 'samples': 396864, 'steps': 2066, 'loss/train': 2.925659418106079} +11/06/2021 21:33:42 - INFO - __main__ - Step 2068: {'lr': 0.0004999997471657763, 'samples': 397056, 'steps': 2067, 'loss/train': 2.795663356781006} +11/06/2021 21:33:43 - INFO - __main__ - Step 2069: {'lr': 0.0004999997395621642, 'samples': 397248, 'steps': 2068, 'loss/train': 2.198864698410034} +11/06/2021 21:33:43 - INFO - __main__ - Step 2070: {'lr': 0.0004999997318459064, 'samples': 397440, 'steps': 2069, 'loss/train': 2.6380443572998047} +11/06/2021 21:33:44 - INFO - __main__ - Step 2071: {'lr': 0.0004999997240170023, 'samples': 397632, 'steps': 2070, 'loss/train': 1.3615984916687012} +11/06/2021 21:33:44 - INFO - __main__ - Step 2072: {'lr': 0.0004999997160754522, 'samples': 397824, 'steps': 2071, 'loss/train': 2.0112996101379395} +11/06/2021 21:33:45 - INFO - __main__ - Step 2073: {'lr': 0.0004999997080212561, 'samples': 398016, 'steps': 2072, 'loss/train': 2.477386236190796} +11/06/2021 21:33:46 - INFO - __main__ - Step 2074: {'lr': 0.000499999699854414, 'samples': 398208, 'steps': 2073, 'loss/train': 3.2133283615112305} +11/06/2021 21:33:46 - INFO - __main__ - Step 2075: {'lr': 0.0004999996915749259, 'samples': 398400, 'steps': 2074, 'loss/train': 2.5600574016571045} +11/06/2021 21:33:46 - INFO - __main__ - Step 2076: {'lr': 0.0004999996831827918, 'samples': 398592, 'steps': 2075, 'loss/train': 2.0490965843200684} +11/06/2021 21:33:47 - INFO - __main__ - Step 2077: {'lr': 0.0004999996746780117, 'samples': 398784, 'steps': 2076, 'loss/train': 2.4900460243225098} +11/06/2021 21:33:47 - INFO - __main__ - Step 2078: {'lr': 0.0004999996660605856, 'samples': 398976, 'steps': 2077, 'loss/train': 2.7026772499084473} +11/06/2021 21:33:47 - INFO - __main__ - Step 2079: {'lr': 0.0004999996573305135, 'samples': 399168, 'steps': 2078, 'loss/train': 1.7970755100250244} +11/06/2021 21:33:48 - INFO - __main__ - Step 2080: {'lr': 0.0004999996484877955, 'samples': 399360, 'steps': 2079, 'loss/train': 2.834831953048706} +11/06/2021 21:33:49 - INFO - __main__ - Step 2081: {'lr': 0.0004999996395324313, 'samples': 399552, 'steps': 2080, 'loss/train': 2.1271467208862305} +11/06/2021 21:33:49 - INFO - __main__ - Step 2082: {'lr': 0.0004999996304644213, 'samples': 399744, 'steps': 2081, 'loss/train': 2.7261979579925537} +11/06/2021 21:33:49 - INFO - __main__ - Step 2083: {'lr': 0.0004999996212837653, 'samples': 399936, 'steps': 2082, 'loss/train': 2.50911021232605} +11/06/2021 21:33:50 - INFO - __main__ - Step 2084: {'lr': 0.0004999996119904633, 'samples': 400128, 'steps': 2083, 'loss/train': 2.5453062057495117} +11/06/2021 21:33:51 - INFO - __main__ - Step 2085: {'lr': 0.0004999996025845154, 'samples': 400320, 'steps': 2084, 'loss/train': 2.562901496887207} +11/06/2021 21:33:51 - INFO - __main__ - Step 2086: {'lr': 0.0004999995930659215, 'samples': 400512, 'steps': 2085, 'loss/train': 2.8472900390625} +11/06/2021 21:33:51 - INFO - __main__ - Step 2087: {'lr': 0.0004999995834346815, 'samples': 400704, 'steps': 2086, 'loss/train': 2.197766065597534} +11/06/2021 21:33:52 - INFO - __main__ - Step 2088: {'lr': 0.0004999995736907957, 'samples': 400896, 'steps': 2087, 'loss/train': 2.4093174934387207} +11/06/2021 21:33:52 - INFO - __main__ - Step 2089: {'lr': 0.000499999563834264, 'samples': 401088, 'steps': 2088, 'loss/train': 2.8441734313964844} +11/06/2021 21:33:53 - INFO - __main__ - Step 2090: {'lr': 0.0004999995538650862, 'samples': 401280, 'steps': 2089, 'loss/train': 2.863389492034912} +11/06/2021 21:33:53 - INFO - __main__ - Step 2091: {'lr': 0.0004999995437832626, 'samples': 401472, 'steps': 2090, 'loss/train': 2.4036967754364014} +11/06/2021 21:33:54 - INFO - __main__ - Step 2092: {'lr': 0.0004999995335887929, 'samples': 401664, 'steps': 2091, 'loss/train': 2.5592567920684814} +11/06/2021 21:33:54 - INFO - __main__ - Step 2093: {'lr': 0.0004999995232816774, 'samples': 401856, 'steps': 2092, 'loss/train': 2.0404558181762695} +11/06/2021 21:33:54 - INFO - __main__ - Step 2094: {'lr': 0.000499999512861916, 'samples': 402048, 'steps': 2093, 'loss/train': 2.452481985092163} +11/06/2021 21:33:56 - INFO - __main__ - Step 2095: {'lr': 0.0004999995023295086, 'samples': 402240, 'steps': 2094, 'loss/train': 2.8676137924194336} +11/06/2021 21:33:56 - INFO - __main__ - Step 2096: {'lr': 0.0004999994916844552, 'samples': 402432, 'steps': 2095, 'loss/train': 2.586151599884033} +11/06/2021 21:33:56 - INFO - __main__ - Step 2097: {'lr': 0.0004999994809267561, 'samples': 402624, 'steps': 2096, 'loss/train': 2.180725574493408} +11/06/2021 21:33:57 - INFO - __main__ - Step 2098: {'lr': 0.0004999994700564109, 'samples': 402816, 'steps': 2097, 'loss/train': 2.6748390197753906} +11/06/2021 21:33:57 - INFO - __main__ - Step 2099: {'lr': 0.0004999994590734199, 'samples': 403008, 'steps': 2098, 'loss/train': 2.2900843620300293} +11/06/2021 21:33:58 - INFO - __main__ - Step 2100: {'lr': 0.000499999447977783, 'samples': 403200, 'steps': 2099, 'loss/train': 2.7498953342437744} +11/06/2021 21:33:58 - INFO - __main__ - Step 2101: {'lr': 0.0004999994367695001, 'samples': 403392, 'steps': 2100, 'loss/train': 2.9146597385406494} +11/06/2021 21:33:59 - INFO - __main__ - Step 2102: {'lr': 0.0004999994254485714, 'samples': 403584, 'steps': 2101, 'loss/train': 2.650158166885376} +11/06/2021 21:33:59 - INFO - __main__ - Step 2103: {'lr': 0.0004999994140149969, 'samples': 403776, 'steps': 2102, 'loss/train': 2.6396777629852295} +11/06/2021 21:33:59 - INFO - __main__ - Step 2104: {'lr': 0.0004999994024687764, 'samples': 403968, 'steps': 2103, 'loss/train': 2.664414644241333} +11/06/2021 21:34:00 - INFO - __main__ - Step 2105: {'lr': 0.00049999939080991, 'samples': 404160, 'steps': 2104, 'loss/train': 1.7636381387710571} +11/06/2021 21:34:01 - INFO - __main__ - Step 2106: {'lr': 0.0004999993790383978, 'samples': 404352, 'steps': 2105, 'loss/train': 2.3601715564727783} +11/06/2021 21:34:01 - INFO - __main__ - Step 2107: {'lr': 0.0004999993671542397, 'samples': 404544, 'steps': 2106, 'loss/train': 1.9566963911056519} +11/06/2021 21:34:01 - INFO - __main__ - Step 2108: {'lr': 0.0004999993551574358, 'samples': 404736, 'steps': 2107, 'loss/train': 1.9892882108688354} +11/06/2021 21:34:02 - INFO - __main__ - Step 2109: {'lr': 0.000499999343047986, 'samples': 404928, 'steps': 2108, 'loss/train': 2.693075180053711} +11/06/2021 21:34:02 - INFO - __main__ - Step 2110: {'lr': 0.0004999993308258904, 'samples': 405120, 'steps': 2109, 'loss/train': 2.1097216606140137} +11/06/2021 21:34:03 - INFO - __main__ - Step 2111: {'lr': 0.0004999993184911489, 'samples': 405312, 'steps': 2110, 'loss/train': 2.149388074874878} +11/06/2021 21:34:04 - INFO - __main__ - Step 2112: {'lr': 0.0004999993060437616, 'samples': 405504, 'steps': 2111, 'loss/train': 1.7287077903747559} +11/06/2021 21:34:04 - INFO - __main__ - Step 2113: {'lr': 0.0004999992934837284, 'samples': 405696, 'steps': 2112, 'loss/train': 2.66508150100708} +11/06/2021 21:34:04 - INFO - __main__ - Step 2114: {'lr': 0.0004999992808110495, 'samples': 405888, 'steps': 2113, 'loss/train': 2.4178295135498047} +11/06/2021 21:34:05 - INFO - __main__ - Step 2115: {'lr': 0.0004999992680257247, 'samples': 406080, 'steps': 2114, 'loss/train': 2.6689789295196533} +11/06/2021 21:34:06 - INFO - __main__ - Step 2116: {'lr': 0.0004999992551277541, 'samples': 406272, 'steps': 2115, 'loss/train': 2.902282953262329} +11/06/2021 21:34:06 - INFO - __main__ - Step 2117: {'lr': 0.0004999992421171377, 'samples': 406464, 'steps': 2116, 'loss/train': 2.81160306930542} +11/06/2021 21:34:06 - INFO - __main__ - Step 2118: {'lr': 0.0004999992289938755, 'samples': 406656, 'steps': 2117, 'loss/train': 2.694124698638916} +11/06/2021 21:34:07 - INFO - __main__ - Step 2119: {'lr': 0.0004999992157579676, 'samples': 406848, 'steps': 2118, 'loss/train': 3.20439076423645} +11/06/2021 21:34:07 - INFO - __main__ - Step 2120: {'lr': 0.0004999992024094138, 'samples': 407040, 'steps': 2119, 'loss/train': 2.9919791221618652} +11/06/2021 21:34:08 - INFO - __main__ - Step 2121: {'lr': 0.0004999991889482142, 'samples': 407232, 'steps': 2120, 'loss/train': 2.432868003845215} +11/06/2021 21:34:08 - INFO - __main__ - Step 2122: {'lr': 0.0004999991753743689, 'samples': 407424, 'steps': 2121, 'loss/train': 2.5452983379364014} +11/06/2021 21:34:09 - INFO - __main__ - Step 2123: {'lr': 0.0004999991616878777, 'samples': 407616, 'steps': 2122, 'loss/train': 2.8512609004974365} +11/06/2021 21:34:09 - INFO - __main__ - Step 2124: {'lr': 0.0004999991478887409, 'samples': 407808, 'steps': 2123, 'loss/train': 2.363013505935669} +11/06/2021 21:34:09 - INFO - __main__ - Step 2125: {'lr': 0.0004999991339769582, 'samples': 408000, 'steps': 2124, 'loss/train': 2.3409323692321777} +11/06/2021 21:34:10 - INFO - __main__ - Step 2126: {'lr': 0.0004999991199525299, 'samples': 408192, 'steps': 2125, 'loss/train': 2.357633113861084} +11/06/2021 21:34:11 - INFO - __main__ - Step 2127: {'lr': 0.0004999991058154557, 'samples': 408384, 'steps': 2126, 'loss/train': 2.454667091369629} +11/06/2021 21:34:11 - INFO - __main__ - Step 2128: {'lr': 0.0004999990915657359, 'samples': 408576, 'steps': 2127, 'loss/train': 1.9439713954925537} +11/06/2021 21:34:11 - INFO - __main__ - Step 2129: {'lr': 0.0004999990772033702, 'samples': 408768, 'steps': 2128, 'loss/train': 2.639913320541382} +11/06/2021 21:34:12 - INFO - __main__ - Step 2130: {'lr': 0.000499999062728359, 'samples': 408960, 'steps': 2129, 'loss/train': 2.727692127227783} +11/06/2021 21:34:12 - INFO - __main__ - Step 2131: {'lr': 0.0004999990481407018, 'samples': 409152, 'steps': 2130, 'loss/train': 2.4127743244171143} +11/06/2021 21:34:13 - INFO - __main__ - Step 2132: {'lr': 0.0004999990334403991, 'samples': 409344, 'steps': 2131, 'loss/train': 2.539153575897217} +11/06/2021 21:34:14 - INFO - __main__ - Step 2133: {'lr': 0.0004999990186274506, 'samples': 409536, 'steps': 2132, 'loss/train': 2.580580949783325} +11/06/2021 21:34:14 - INFO - __main__ - Step 2134: {'lr': 0.0004999990037018564, 'samples': 409728, 'steps': 2133, 'loss/train': 2.830368757247925} +11/06/2021 21:34:14 - INFO - __main__ - Step 2135: {'lr': 0.0004999989886636166, 'samples': 409920, 'steps': 2134, 'loss/train': 2.996830463409424} +11/06/2021 21:34:15 - INFO - __main__ - Step 2136: {'lr': 0.000499998973512731, 'samples': 410112, 'steps': 2135, 'loss/train': 2.449648141860962} +11/06/2021 21:34:16 - INFO - __main__ - Step 2137: {'lr': 0.0004999989582491998, 'samples': 410304, 'steps': 2136, 'loss/train': 2.1310882568359375} +11/06/2021 21:34:16 - INFO - __main__ - Step 2138: {'lr': 0.0004999989428730229, 'samples': 410496, 'steps': 2137, 'loss/train': 2.7264044284820557} +11/06/2021 21:34:17 - INFO - __main__ - Step 2139: {'lr': 0.0004999989273842003, 'samples': 410688, 'steps': 2138, 'loss/train': 2.348263740539551} +11/06/2021 21:34:17 - INFO - __main__ - Step 2140: {'lr': 0.0004999989117827321, 'samples': 410880, 'steps': 2139, 'loss/train': 2.6819005012512207} +11/06/2021 21:34:17 - INFO - __main__ - Step 2141: {'lr': 0.0004999988960686182, 'samples': 411072, 'steps': 2140, 'loss/train': 1.7351843118667603} +11/06/2021 21:34:18 - INFO - __main__ - Step 2142: {'lr': 0.0004999988802418587, 'samples': 411264, 'steps': 2141, 'loss/train': 2.5951883792877197} +11/06/2021 21:34:19 - INFO - __main__ - Step 2143: {'lr': 0.0004999988643024536, 'samples': 411456, 'steps': 2142, 'loss/train': 2.5091636180877686} +11/06/2021 21:34:19 - INFO - __main__ - Step 2144: {'lr': 0.0004999988482504027, 'samples': 411648, 'steps': 2143, 'loss/train': 2.721625804901123} +11/06/2021 21:34:19 - INFO - __main__ - Step 2145: {'lr': 0.0004999988320857063, 'samples': 411840, 'steps': 2144, 'loss/train': 2.778151750564575} +11/06/2021 21:34:20 - INFO - __main__ - Step 2146: {'lr': 0.0004999988158083643, 'samples': 412032, 'steps': 2145, 'loss/train': 2.607226848602295} +11/06/2021 21:34:20 - INFO - __main__ - Step 2147: {'lr': 0.0004999987994183766, 'samples': 412224, 'steps': 2146, 'loss/train': 2.325345277786255} +11/06/2021 21:34:21 - INFO - __main__ - Step 2148: {'lr': 0.0004999987829157434, 'samples': 412416, 'steps': 2147, 'loss/train': 2.363879442214966} +11/06/2021 21:34:21 - INFO - __main__ - Step 2149: {'lr': 0.0004999987663004646, 'samples': 412608, 'steps': 2148, 'loss/train': 2.3791654109954834} +11/06/2021 21:34:22 - INFO - __main__ - Step 2150: {'lr': 0.0004999987495725401, 'samples': 412800, 'steps': 2149, 'loss/train': 1.6959710121154785} +11/06/2021 21:34:22 - INFO - __main__ - Step 2151: {'lr': 0.0004999987327319701, 'samples': 412992, 'steps': 2150, 'loss/train': 2.9837472438812256} +11/06/2021 21:34:22 - INFO - __main__ - Step 2152: {'lr': 0.0004999987157787546, 'samples': 413184, 'steps': 2151, 'loss/train': 2.8918848037719727} +11/06/2021 21:34:24 - INFO - __main__ - Step 2153: {'lr': 0.0004999986987128934, 'samples': 413376, 'steps': 2152, 'loss/train': 2.0959744453430176} +11/06/2021 21:34:24 - INFO - __main__ - Step 2154: {'lr': 0.0004999986815343867, 'samples': 413568, 'steps': 2153, 'loss/train': 2.464357614517212} +11/06/2021 21:34:24 - INFO - __main__ - Step 2155: {'lr': 0.0004999986642432345, 'samples': 413760, 'steps': 2154, 'loss/train': 2.6230199337005615} +11/06/2021 21:34:25 - INFO - __main__ - Step 2156: {'lr': 0.0004999986468394367, 'samples': 413952, 'steps': 2155, 'loss/train': 2.50052547454834} +11/06/2021 21:34:25 - INFO - __main__ - Step 2157: {'lr': 0.0004999986293229934, 'samples': 414144, 'steps': 2156, 'loss/train': 2.743523359298706} +11/06/2021 21:34:26 - INFO - __main__ - Step 2158: {'lr': 0.0004999986116939045, 'samples': 414336, 'steps': 2157, 'loss/train': 2.9330990314483643} +11/06/2021 21:34:26 - INFO - __main__ - Step 2159: {'lr': 0.0004999985939521702, 'samples': 414528, 'steps': 2158, 'loss/train': 3.325244426727295} +11/06/2021 21:34:27 - INFO - __main__ - Step 2160: {'lr': 0.0004999985760977903, 'samples': 414720, 'steps': 2159, 'loss/train': 2.2128641605377197} +11/06/2021 21:34:27 - INFO - __main__ - Step 2161: {'lr': 0.000499998558130765, 'samples': 414912, 'steps': 2160, 'loss/train': 2.9361557960510254} +11/06/2021 21:34:27 - INFO - __main__ - Step 2162: {'lr': 0.0004999985400510941, 'samples': 415104, 'steps': 2161, 'loss/train': 2.5086746215820312} +11/06/2021 21:34:28 - INFO - __main__ - Step 2163: {'lr': 0.0004999985218587777, 'samples': 415296, 'steps': 2162, 'loss/train': 1.6962592601776123} +11/06/2021 21:34:29 - INFO - __main__ - Step 2164: {'lr': 0.0004999985035538159, 'samples': 415488, 'steps': 2163, 'loss/train': 2.615097761154175} +11/06/2021 21:34:29 - INFO - __main__ - Step 2165: {'lr': 0.0004999984851362086, 'samples': 415680, 'steps': 2164, 'loss/train': 2.722036600112915} +11/06/2021 21:34:29 - INFO - __main__ - Step 2166: {'lr': 0.0004999984666059559, 'samples': 415872, 'steps': 2165, 'loss/train': 2.560600996017456} +11/06/2021 21:34:30 - INFO - __main__ - Step 2167: {'lr': 0.0004999984479630577, 'samples': 416064, 'steps': 2166, 'loss/train': 2.6970345973968506} +11/06/2021 21:34:30 - INFO - __main__ - Step 2168: {'lr': 0.000499998429207514, 'samples': 416256, 'steps': 2167, 'loss/train': 2.9107210636138916} +11/06/2021 21:34:31 - INFO - __main__ - Step 2169: {'lr': 0.000499998410339325, 'samples': 416448, 'steps': 2168, 'loss/train': 2.580718994140625} +11/06/2021 21:34:32 - INFO - __main__ - Step 2170: {'lr': 0.0004999983913584904, 'samples': 416640, 'steps': 2169, 'loss/train': 2.8567304611206055} +11/06/2021 21:34:32 - INFO - __main__ - Step 2171: {'lr': 0.0004999983722650106, 'samples': 416832, 'steps': 2170, 'loss/train': 2.371682643890381} +11/06/2021 21:34:32 - INFO - __main__ - Step 2172: {'lr': 0.0004999983530588853, 'samples': 417024, 'steps': 2171, 'loss/train': 2.061142921447754} +11/06/2021 21:34:33 - INFO - __main__ - Step 2173: {'lr': 0.0004999983337401145, 'samples': 417216, 'steps': 2172, 'loss/train': 2.451244354248047} +11/06/2021 21:34:34 - INFO - __main__ - Step 2174: {'lr': 0.0004999983143086984, 'samples': 417408, 'steps': 2173, 'loss/train': 1.99120032787323} +11/06/2021 21:34:34 - INFO - __main__ - Step 2175: {'lr': 0.0004999982947646368, 'samples': 417600, 'steps': 2174, 'loss/train': 2.0224850177764893} +11/06/2021 21:34:34 - INFO - __main__ - Step 2176: {'lr': 0.00049999827510793, 'samples': 417792, 'steps': 2175, 'loss/train': 2.3628859519958496} +11/06/2021 21:34:35 - INFO - __main__ - Step 2177: {'lr': 0.0004999982553385778, 'samples': 417984, 'steps': 2176, 'loss/train': 2.5779266357421875} +11/06/2021 21:34:35 - INFO - __main__ - Step 2178: {'lr': 0.0004999982354565802, 'samples': 418176, 'steps': 2177, 'loss/train': 2.631287097930908} +11/06/2021 21:34:36 - INFO - __main__ - Step 2179: {'lr': 0.0004999982154619372, 'samples': 418368, 'steps': 2178, 'loss/train': 2.691127300262451} +11/06/2021 21:34:36 - INFO - __main__ - Step 2180: {'lr': 0.000499998195354649, 'samples': 418560, 'steps': 2179, 'loss/train': 2.6451637744903564} +11/06/2021 21:34:37 - INFO - __main__ - Step 2181: {'lr': 0.0004999981751347153, 'samples': 418752, 'steps': 2180, 'loss/train': 3.3670623302459717} +11/06/2021 21:34:37 - INFO - __main__ - Step 2182: {'lr': 0.0004999981548021364, 'samples': 418944, 'steps': 2181, 'loss/train': 2.2093632221221924} +11/06/2021 21:34:37 - INFO - __main__ - Step 2183: {'lr': 0.0004999981343569122, 'samples': 419136, 'steps': 2182, 'loss/train': 2.704352855682373} +11/06/2021 21:34:38 - INFO - __main__ - Step 2184: {'lr': 0.0004999981137990425, 'samples': 419328, 'steps': 2183, 'loss/train': 3.1171112060546875} +11/06/2021 21:34:39 - INFO - __main__ - Step 2185: {'lr': 0.0004999980931285278, 'samples': 419520, 'steps': 2184, 'loss/train': 2.5423855781555176} +11/06/2021 21:34:39 - INFO - __main__ - Step 2186: {'lr': 0.0004999980723453676, 'samples': 419712, 'steps': 2185, 'loss/train': 1.9052900075912476} +11/06/2021 21:34:40 - INFO - __main__ - Step 2187: {'lr': 0.0004999980514495623, 'samples': 419904, 'steps': 2186, 'loss/train': 2.7308359146118164} +11/06/2021 21:34:40 - INFO - __main__ - Step 2188: {'lr': 0.0004999980304411116, 'samples': 420096, 'steps': 2187, 'loss/train': 2.344801902770996} +11/06/2021 21:34:40 - INFO - __main__ - Step 2189: {'lr': 0.0004999980093200157, 'samples': 420288, 'steps': 2188, 'loss/train': 2.7158095836639404} +11/06/2021 21:34:41 - INFO - __main__ - Step 2190: {'lr': 0.0004999979880862745, 'samples': 420480, 'steps': 2189, 'loss/train': 1.4334872961044312} +11/06/2021 21:34:42 - INFO - __main__ - Step 2191: {'lr': 0.0004999979667398882, 'samples': 420672, 'steps': 2190, 'loss/train': 2.5495493412017822} +11/06/2021 21:34:42 - INFO - __main__ - Step 2192: {'lr': 0.0004999979452808565, 'samples': 420864, 'steps': 2191, 'loss/train': 2.356931447982788} +11/06/2021 21:34:42 - INFO - __main__ - Step 2193: {'lr': 0.0004999979237091796, 'samples': 421056, 'steps': 2192, 'loss/train': 2.551086902618408} +11/06/2021 21:34:43 - INFO - __main__ - Step 2194: {'lr': 0.0004999979020248577, 'samples': 421248, 'steps': 2193, 'loss/train': 2.4983091354370117} +11/06/2021 21:34:43 - INFO - __main__ - Step 2195: {'lr': 0.0004999978802278904, 'samples': 421440, 'steps': 2194, 'loss/train': 2.6009490489959717} +11/06/2021 21:34:44 - INFO - __main__ - Step 2196: {'lr': 0.000499997858318278, 'samples': 421632, 'steps': 2195, 'loss/train': 2.3032186031341553} +11/06/2021 21:34:45 - INFO - __main__ - Step 2197: {'lr': 0.0004999978362960204, 'samples': 421824, 'steps': 2196, 'loss/train': 2.835674285888672} +11/06/2021 21:34:45 - INFO - __main__ - Step 2198: {'lr': 0.0004999978141611176, 'samples': 422016, 'steps': 2197, 'loss/train': 3.615586042404175} +11/06/2021 21:34:45 - INFO - __main__ - Step 2199: {'lr': 0.0004999977919135696, 'samples': 422208, 'steps': 2198, 'loss/train': 1.8978424072265625} +11/06/2021 21:34:46 - INFO - __main__ - Step 2200: {'lr': 0.0004999977695533766, 'samples': 422400, 'steps': 2199, 'loss/train': 2.526134967803955} +11/06/2021 21:34:47 - INFO - __main__ - Step 2201: {'lr': 0.0004999977470805383, 'samples': 422592, 'steps': 2200, 'loss/train': 2.3798577785491943} +11/06/2021 21:34:47 - INFO - __main__ - Step 2202: {'lr': 0.0004999977244950551, 'samples': 422784, 'steps': 2201, 'loss/train': 2.6443750858306885} +11/06/2021 21:34:47 - INFO - __main__ - Step 2203: {'lr': 0.0004999977017969266, 'samples': 422976, 'steps': 2202, 'loss/train': 1.9695329666137695} +11/06/2021 21:34:48 - INFO - __main__ - Step 2204: {'lr': 0.000499997678986153, 'samples': 423168, 'steps': 2203, 'loss/train': 2.704178810119629} +11/06/2021 21:34:48 - INFO - __main__ - Step 2205: {'lr': 0.0004999976560627344, 'samples': 423360, 'steps': 2204, 'loss/train': 2.8710994720458984} +11/06/2021 21:34:49 - INFO - __main__ - Step 2206: {'lr': 0.0004999976330266707, 'samples': 423552, 'steps': 2205, 'loss/train': 2.6105599403381348} +11/06/2021 21:34:49 - INFO - __main__ - Step 2207: {'lr': 0.0004999976098779618, 'samples': 423744, 'steps': 2206, 'loss/train': 2.541774272918701} +11/06/2021 21:34:50 - INFO - __main__ - Step 2208: {'lr': 0.0004999975866166079, 'samples': 423936, 'steps': 2207, 'loss/train': 2.3094847202301025} +11/06/2021 21:34:50 - INFO - __main__ - Step 2209: {'lr': 0.000499997563242609, 'samples': 424128, 'steps': 2208, 'loss/train': 2.5492539405822754} +11/06/2021 21:34:50 - INFO - __main__ - Step 2210: {'lr': 0.0004999975397559649, 'samples': 424320, 'steps': 2209, 'loss/train': 2.095379114151001} +11/06/2021 21:34:52 - INFO - __main__ - Step 2211: {'lr': 0.000499997516156676, 'samples': 424512, 'steps': 2210, 'loss/train': 2.605085849761963} +11/06/2021 21:34:52 - INFO - __main__ - Step 2212: {'lr': 0.000499997492444742, 'samples': 424704, 'steps': 2211, 'loss/train': 2.455345630645752} +11/06/2021 21:34:52 - INFO - __main__ - Step 2213: {'lr': 0.0004999974686201629, 'samples': 424896, 'steps': 2212, 'loss/train': 2.637754201889038} +11/06/2021 21:34:53 - INFO - __main__ - Step 2214: {'lr': 0.0004999974446829389, 'samples': 425088, 'steps': 2213, 'loss/train': 2.4633007049560547} +11/06/2021 21:34:53 - INFO - __main__ - Step 2215: {'lr': 0.0004999974206330698, 'samples': 425280, 'steps': 2214, 'loss/train': 2.5374715328216553} +11/06/2021 21:34:53 - INFO - __main__ - Step 2216: {'lr': 0.0004999973964705558, 'samples': 425472, 'steps': 2215, 'loss/train': 2.7447330951690674} +11/06/2021 21:34:54 - INFO - __main__ - Step 2217: {'lr': 0.0004999973721953968, 'samples': 425664, 'steps': 2216, 'loss/train': 2.3357722759246826} +11/06/2021 21:34:55 - INFO - __main__ - Step 2218: {'lr': 0.0004999973478075928, 'samples': 425856, 'steps': 2217, 'loss/train': 2.6798555850982666} +11/06/2021 21:34:55 - INFO - __main__ - Step 2219: {'lr': 0.0004999973233071438, 'samples': 426048, 'steps': 2218, 'loss/train': 2.2830727100372314} +11/06/2021 21:34:55 - INFO - __main__ - Step 2220: {'lr': 0.00049999729869405, 'samples': 426240, 'steps': 2219, 'loss/train': 2.466994524002075} +11/06/2021 21:34:56 - INFO - __main__ - Step 2221: {'lr': 0.0004999972739683113, 'samples': 426432, 'steps': 2220, 'loss/train': 2.3057074546813965} +11/06/2021 21:34:57 - INFO - __main__ - Step 2222: {'lr': 0.0004999972491299276, 'samples': 426624, 'steps': 2221, 'loss/train': 2.5645909309387207} +11/06/2021 21:34:57 - INFO - __main__ - Step 2223: {'lr': 0.000499997224178899, 'samples': 426816, 'steps': 2222, 'loss/train': 2.493025064468384} +11/06/2021 21:34:57 - INFO - __main__ - Step 2224: {'lr': 0.0004999971991152256, 'samples': 427008, 'steps': 2223, 'loss/train': 3.2061784267425537} +11/06/2021 21:34:58 - INFO - __main__ - Step 2225: {'lr': 0.0004999971739389072, 'samples': 427200, 'steps': 2224, 'loss/train': 2.114089250564575} +11/06/2021 21:34:58 - INFO - __main__ - Step 2226: {'lr': 0.000499997148649944, 'samples': 427392, 'steps': 2225, 'loss/train': 2.6324121952056885} +11/06/2021 21:34:59 - INFO - __main__ - Step 2227: {'lr': 0.0004999971232483359, 'samples': 427584, 'steps': 2226, 'loss/train': 2.3817732334136963} +11/06/2021 21:34:59 - INFO - __main__ - Step 2228: {'lr': 0.0004999970977340829, 'samples': 427776, 'steps': 2227, 'loss/train': 2.323068380355835} +11/06/2021 21:35:00 - INFO - __main__ - Step 2229: {'lr': 0.0004999970721071852, 'samples': 427968, 'steps': 2228, 'loss/train': 2.610438585281372} +11/06/2021 21:35:00 - INFO - __main__ - Step 2230: {'lr': 0.0004999970463676427, 'samples': 428160, 'steps': 2229, 'loss/train': 2.492368221282959} +11/06/2021 21:35:00 - INFO - __main__ - Step 2231: {'lr': 0.0004999970205154553, 'samples': 428352, 'steps': 2230, 'loss/train': 2.369539499282837} +11/06/2021 21:35:02 - INFO - __main__ - Step 2232: {'lr': 0.000499996994550623, 'samples': 428544, 'steps': 2231, 'loss/train': 2.712465524673462} +11/06/2021 21:35:02 - INFO - __main__ - Step 2233: {'lr': 0.000499996968473146, 'samples': 428736, 'steps': 2232, 'loss/train': 3.136364221572876} +11/06/2021 21:35:02 - INFO - __main__ - Step 2234: {'lr': 0.0004999969422830242, 'samples': 428928, 'steps': 2233, 'loss/train': 1.8193436861038208} +11/06/2021 21:35:03 - INFO - __main__ - Step 2235: {'lr': 0.0004999969159802577, 'samples': 429120, 'steps': 2234, 'loss/train': 2.6638810634613037} +11/06/2021 21:35:03 - INFO - __main__ - Step 2236: {'lr': 0.0004999968895648464, 'samples': 429312, 'steps': 2235, 'loss/train': 2.946650505065918} +11/06/2021 21:35:03 - INFO - __main__ - Step 2237: {'lr': 0.0004999968630367905, 'samples': 429504, 'steps': 2236, 'loss/train': 1.9133739471435547} +11/06/2021 21:35:04 - INFO - __main__ - Step 2238: {'lr': 0.0004999968363960897, 'samples': 429696, 'steps': 2237, 'loss/train': 2.461745023727417} +11/06/2021 21:35:05 - INFO - __main__ - Step 2239: {'lr': 0.0004999968096427443, 'samples': 429888, 'steps': 2238, 'loss/train': 1.956204891204834} +11/06/2021 21:35:05 - INFO - __main__ - Step 2240: {'lr': 0.0004999967827767541, 'samples': 430080, 'steps': 2239, 'loss/train': 2.4149010181427} +11/06/2021 21:35:05 - INFO - __main__ - Step 2241: {'lr': 0.0004999967557981192, 'samples': 430272, 'steps': 2240, 'loss/train': 2.339151382446289} +11/06/2021 21:35:06 - INFO - __main__ - Step 2242: {'lr': 0.0004999967287068396, 'samples': 430464, 'steps': 2241, 'loss/train': 1.5045028924942017} +11/06/2021 21:35:07 - INFO - __main__ - Step 2243: {'lr': 0.0004999967015029155, 'samples': 430656, 'steps': 2242, 'loss/train': 2.4464919567108154} +11/06/2021 21:35:07 - INFO - __main__ - Step 2244: {'lr': 0.0004999966741863467, 'samples': 430848, 'steps': 2243, 'loss/train': 2.7989583015441895} +11/06/2021 21:35:07 - INFO - __main__ - Step 2245: {'lr': 0.000499996646757133, 'samples': 431040, 'steps': 2244, 'loss/train': 2.849099636077881} +11/06/2021 21:35:08 - INFO - __main__ - Step 2246: {'lr': 0.0004999966192152749, 'samples': 431232, 'steps': 2245, 'loss/train': 2.3336470127105713} +11/06/2021 21:35:08 - INFO - __main__ - Step 2247: {'lr': 0.0004999965915607722, 'samples': 431424, 'steps': 2246, 'loss/train': 1.3028373718261719} +11/06/2021 21:35:09 - INFO - __main__ - Step 2248: {'lr': 0.0004999965637936248, 'samples': 431616, 'steps': 2247, 'loss/train': 2.4899795055389404} +11/06/2021 21:35:10 - INFO - __main__ - Step 2249: {'lr': 0.0004999965359138329, 'samples': 431808, 'steps': 2248, 'loss/train': 3.0825843811035156} +11/06/2021 21:35:10 - INFO - __main__ - Step 2250: {'lr': 0.0004999965079213964, 'samples': 432000, 'steps': 2249, 'loss/train': 2.510723352432251} +11/06/2021 21:35:10 - INFO - __main__ - Step 2251: {'lr': 0.0004999964798163152, 'samples': 432192, 'steps': 2250, 'loss/train': 2.384847640991211} +11/06/2021 21:35:11 - INFO - __main__ - Step 2252: {'lr': 0.0004999964515985896, 'samples': 432384, 'steps': 2251, 'loss/train': 2.7811596393585205} +11/06/2021 21:35:12 - INFO - __main__ - Step 2253: {'lr': 0.0004999964232682194, 'samples': 432576, 'steps': 2252, 'loss/train': 3.195866823196411} +11/06/2021 21:35:12 - INFO - __main__ - Step 2254: {'lr': 0.0004999963948252046, 'samples': 432768, 'steps': 2253, 'loss/train': 1.684893012046814} +11/06/2021 21:35:12 - INFO - __main__ - Step 2255: {'lr': 0.0004999963662695453, 'samples': 432960, 'steps': 2254, 'loss/train': 2.470139265060425} +11/06/2021 21:35:13 - INFO - __main__ - Step 2256: {'lr': 0.0004999963376012416, 'samples': 433152, 'steps': 2255, 'loss/train': 2.2551157474517822} +11/06/2021 21:35:13 - INFO - __main__ - Step 2257: {'lr': 0.0004999963088202934, 'samples': 433344, 'steps': 2256, 'loss/train': 1.778255581855774} +11/06/2021 21:35:13 - INFO - __main__ - Step 2258: {'lr': 0.0004999962799267006, 'samples': 433536, 'steps': 2257, 'loss/train': 2.4314968585968018} +11/06/2021 21:35:14 - INFO - __main__ - Step 2259: {'lr': 0.0004999962509204634, 'samples': 433728, 'steps': 2258, 'loss/train': 2.8687584400177} +11/06/2021 21:35:15 - INFO - __main__ - Step 2260: {'lr': 0.0004999962218015818, 'samples': 433920, 'steps': 2259, 'loss/train': 2.5391645431518555} +11/06/2021 21:35:15 - INFO - __main__ - Step 2261: {'lr': 0.0004999961925700557, 'samples': 434112, 'steps': 2260, 'loss/train': 2.284990072250366} +11/06/2021 21:35:15 - INFO - __main__ - Step 2262: {'lr': 0.0004999961632258851, 'samples': 434304, 'steps': 2261, 'loss/train': 2.2912981510162354} +11/06/2021 21:35:16 - INFO - __main__ - Step 2263: {'lr': 0.0004999961337690703, 'samples': 434496, 'steps': 2262, 'loss/train': 2.5647494792938232} +11/06/2021 21:35:17 - INFO - __main__ - Step 2264: {'lr': 0.0004999961041996109, 'samples': 434688, 'steps': 2263, 'loss/train': 2.3833937644958496} +11/06/2021 21:35:17 - INFO - __main__ - Step 2265: {'lr': 0.0004999960745175071, 'samples': 434880, 'steps': 2264, 'loss/train': 2.4869725704193115} +11/06/2021 21:35:18 - INFO - __main__ - Step 2266: {'lr': 0.0004999960447227591, 'samples': 435072, 'steps': 2265, 'loss/train': 2.0234827995300293} +11/06/2021 21:35:18 - INFO - __main__ - Step 2267: {'lr': 0.0004999960148153667, 'samples': 435264, 'steps': 2266, 'loss/train': 2.4819018840789795} +11/06/2021 21:35:18 - INFO - __main__ - Step 2268: {'lr': 0.0004999959847953299, 'samples': 435456, 'steps': 2267, 'loss/train': 1.9739242792129517} +11/06/2021 21:35:19 - INFO - __main__ - Step 2269: {'lr': 0.0004999959546626487, 'samples': 435648, 'steps': 2268, 'loss/train': 2.5445456504821777} +11/06/2021 21:35:20 - INFO - __main__ - Step 2270: {'lr': 0.0004999959244173232, 'samples': 435840, 'steps': 2269, 'loss/train': 1.6040853261947632} +11/06/2021 21:35:20 - INFO - __main__ - Step 2271: {'lr': 0.0004999958940593535, 'samples': 436032, 'steps': 2270, 'loss/train': 2.391418218612671} +11/06/2021 21:35:20 - INFO - __main__ - Step 2272: {'lr': 0.0004999958635887394, 'samples': 436224, 'steps': 2271, 'loss/train': 2.7278921604156494} +11/06/2021 21:35:21 - INFO - __main__ - Step 2273: {'lr': 0.0004999958330054811, 'samples': 436416, 'steps': 2272, 'loss/train': 2.206878900527954} +11/06/2021 21:35:21 - INFO - __main__ - Step 2274: {'lr': 0.0004999958023095785, 'samples': 436608, 'steps': 2273, 'loss/train': 2.4823598861694336} +11/06/2021 21:35:22 - INFO - __main__ - Step 2275: {'lr': 0.0004999957715010317, 'samples': 436800, 'steps': 2274, 'loss/train': 2.0036473274230957} +11/06/2021 21:35:22 - INFO - __main__ - Step 2276: {'lr': 0.0004999957405798405, 'samples': 436992, 'steps': 2275, 'loss/train': 2.6134819984436035} +11/06/2021 21:35:23 - INFO - __main__ - Step 2277: {'lr': 0.0004999957095460052, 'samples': 437184, 'steps': 2276, 'loss/train': 2.5736441612243652} +11/06/2021 21:35:23 - INFO - __main__ - Step 2278: {'lr': 0.0004999956783995257, 'samples': 437376, 'steps': 2277, 'loss/train': 2.585498809814453} +11/06/2021 21:35:23 - INFO - __main__ - Step 2279: {'lr': 0.0004999956471404021, 'samples': 437568, 'steps': 2278, 'loss/train': 2.7420217990875244} +11/06/2021 21:35:24 - INFO - __main__ - Step 2280: {'lr': 0.0004999956157686341, 'samples': 437760, 'steps': 2279, 'loss/train': 2.3299975395202637} +11/06/2021 21:35:25 - INFO - __main__ - Step 2281: {'lr': 0.0004999955842842222, 'samples': 437952, 'steps': 2280, 'loss/train': 2.463308334350586} +11/06/2021 21:35:25 - INFO - __main__ - Step 2282: {'lr': 0.0004999955526871659, 'samples': 438144, 'steps': 2281, 'loss/train': 1.7193819284439087} +11/06/2021 21:35:26 - INFO - __main__ - Step 2283: {'lr': 0.0004999955209774656, 'samples': 438336, 'steps': 2282, 'loss/train': 2.3171699047088623} +11/06/2021 21:35:26 - INFO - __main__ - Step 2284: {'lr': 0.0004999954891551211, 'samples': 438528, 'steps': 2283, 'loss/train': 3.057791233062744} +11/06/2021 21:35:27 - INFO - __main__ - Step 2285: {'lr': 0.0004999954572201326, 'samples': 438720, 'steps': 2284, 'loss/train': 2.662093162536621} +11/06/2021 21:35:27 - INFO - __main__ - Step 2286: {'lr': 0.0004999954251724999, 'samples': 438912, 'steps': 2285, 'loss/train': 2.635653495788574} +11/06/2021 21:35:28 - INFO - __main__ - Step 2287: {'lr': 0.0004999953930122231, 'samples': 439104, 'steps': 2286, 'loss/train': 2.4084901809692383} +11/06/2021 21:35:28 - INFO - __main__ - Step 2288: {'lr': 0.0004999953607393023, 'samples': 439296, 'steps': 2287, 'loss/train': 2.4325740337371826} +11/06/2021 21:35:28 - INFO - __main__ - Step 2289: {'lr': 0.0004999953283537374, 'samples': 439488, 'steps': 2288, 'loss/train': 2.2441446781158447} +11/06/2021 21:35:29 - INFO - __main__ - Step 2290: {'lr': 0.0004999952958555285, 'samples': 439680, 'steps': 2289, 'loss/train': 3.243093729019165} +11/06/2021 21:35:30 - INFO - __main__ - Step 2291: {'lr': 0.0004999952632446756, 'samples': 439872, 'steps': 2290, 'loss/train': 2.7363367080688477} +11/06/2021 21:35:30 - INFO - __main__ - Step 2292: {'lr': 0.0004999952305211786, 'samples': 440064, 'steps': 2291, 'loss/train': 1.7157084941864014} +11/06/2021 21:35:31 - INFO - __main__ - Step 2293: {'lr': 0.0004999951976850377, 'samples': 440256, 'steps': 2292, 'loss/train': 1.871019721031189} +11/06/2021 21:35:31 - INFO - __main__ - Step 2294: {'lr': 0.0004999951647362527, 'samples': 440448, 'steps': 2293, 'loss/train': 2.4851877689361572} +11/06/2021 21:35:32 - INFO - __main__ - Step 2295: {'lr': 0.0004999951316748239, 'samples': 440640, 'steps': 2294, 'loss/train': 2.7389845848083496} +11/06/2021 21:35:32 - INFO - __main__ - Step 2296: {'lr': 0.0004999950985007511, 'samples': 440832, 'steps': 2295, 'loss/train': 1.447107195854187} +11/06/2021 21:35:33 - INFO - __main__ - Step 2297: {'lr': 0.0004999950652140343, 'samples': 441024, 'steps': 2296, 'loss/train': 2.8587417602539062} +11/06/2021 21:35:33 - INFO - __main__ - Step 2298: {'lr': 0.0004999950318146737, 'samples': 441216, 'steps': 2297, 'loss/train': 2.5910117626190186} +11/06/2021 21:35:33 - INFO - __main__ - Step 2299: {'lr': 0.0004999949983026691, 'samples': 441408, 'steps': 2298, 'loss/train': 2.3904645442962646} +11/06/2021 21:35:34 - INFO - __main__ - Step 2300: {'lr': 0.0004999949646780205, 'samples': 441600, 'steps': 2299, 'loss/train': 2.857335329055786} +11/06/2021 21:35:35 - INFO - __main__ - Step 2301: {'lr': 0.0004999949309407283, 'samples': 441792, 'steps': 2300, 'loss/train': 2.917921543121338} +11/06/2021 21:35:35 - INFO - __main__ - Step 2302: {'lr': 0.0004999948970907921, 'samples': 441984, 'steps': 2301, 'loss/train': 2.345691442489624} +11/06/2021 21:35:36 - INFO - __main__ - Step 2303: {'lr': 0.0004999948631282119, 'samples': 442176, 'steps': 2302, 'loss/train': 1.4263627529144287} +11/06/2021 21:35:36 - INFO - __main__ - Step 2304: {'lr': 0.0004999948290529881, 'samples': 442368, 'steps': 2303, 'loss/train': 2.424299955368042} +11/06/2021 21:35:36 - INFO - __main__ - Step 2305: {'lr': 0.0004999947948651204, 'samples': 442560, 'steps': 2304, 'loss/train': 1.874759316444397} +11/06/2021 21:35:37 - INFO - __main__ - Step 2306: {'lr': 0.0004999947605646089, 'samples': 442752, 'steps': 2305, 'loss/train': 2.55169677734375} +11/06/2021 21:35:38 - INFO - __main__ - Step 2307: {'lr': 0.0004999947261514537, 'samples': 442944, 'steps': 2306, 'loss/train': 2.5056583881378174} +11/06/2021 21:35:38 - INFO - __main__ - Step 2308: {'lr': 0.0004999946916256547, 'samples': 443136, 'steps': 2307, 'loss/train': 2.708646535873413} +11/06/2021 21:35:38 - INFO - __main__ - Step 2309: {'lr': 0.0004999946569872118, 'samples': 443328, 'steps': 2308, 'loss/train': 2.174234628677368} +11/06/2021 21:35:39 - INFO - __main__ - Step 2310: {'lr': 0.0004999946222361254, 'samples': 443520, 'steps': 2309, 'loss/train': 2.365739107131958} +11/06/2021 21:35:40 - INFO - __main__ - Step 2311: {'lr': 0.0004999945873723951, 'samples': 443712, 'steps': 2310, 'loss/train': 2.3640260696411133} +11/06/2021 21:35:40 - INFO - __main__ - Step 2312: {'lr': 0.0004999945523960212, 'samples': 443904, 'steps': 2311, 'loss/train': 1.8592215776443481} +11/06/2021 21:35:40 - INFO - __main__ - Step 2313: {'lr': 0.0004999945173070035, 'samples': 444096, 'steps': 2312, 'loss/train': 2.9647116661071777} +11/06/2021 21:35:41 - INFO - __main__ - Step 2314: {'lr': 0.0004999944821053422, 'samples': 444288, 'steps': 2313, 'loss/train': 2.653313636779785} +11/06/2021 21:35:41 - INFO - __main__ - Step 2315: {'lr': 0.0004999944467910372, 'samples': 444480, 'steps': 2314, 'loss/train': 2.4893155097961426} +11/06/2021 21:35:42 - INFO - __main__ - Step 2316: {'lr': 0.0004999944113640887, 'samples': 444672, 'steps': 2315, 'loss/train': 2.724855422973633} +11/06/2021 21:35:43 - INFO - __main__ - Step 2317: {'lr': 0.0004999943758244964, 'samples': 444864, 'steps': 2316, 'loss/train': 2.472731590270996} +11/06/2021 21:35:43 - INFO - __main__ - Step 2318: {'lr': 0.0004999943401722606, 'samples': 445056, 'steps': 2317, 'loss/train': 2.70874285697937} +11/06/2021 21:35:43 - INFO - __main__ - Step 2319: {'lr': 0.0004999943044073813, 'samples': 445248, 'steps': 2318, 'loss/train': 2.925724983215332} +11/06/2021 21:35:44 - INFO - __main__ - Step 2320: {'lr': 0.0004999942685298582, 'samples': 445440, 'steps': 2319, 'loss/train': 2.7367475032806396} +11/06/2021 21:35:44 - INFO - __main__ - Step 2321: {'lr': 0.0004999942325396916, 'samples': 445632, 'steps': 2320, 'loss/train': 2.439120054244995} +11/06/2021 21:35:45 - INFO - __main__ - Step 2322: {'lr': 0.0004999941964368817, 'samples': 445824, 'steps': 2321, 'loss/train': 2.9538588523864746} +11/06/2021 21:35:45 - INFO - __main__ - Step 2323: {'lr': 0.000499994160221428, 'samples': 446016, 'steps': 2322, 'loss/train': 2.5466785430908203} +11/06/2021 21:35:46 - INFO - __main__ - Step 2324: {'lr': 0.0004999941238933308, 'samples': 446208, 'steps': 2323, 'loss/train': 2.833611488342285} +11/06/2021 21:35:46 - INFO - __main__ - Step 2325: {'lr': 0.0004999940874525902, 'samples': 446400, 'steps': 2324, 'loss/train': 2.2067928314208984} +11/06/2021 21:35:46 - INFO - __main__ - Step 2326: {'lr': 0.0004999940508992061, 'samples': 446592, 'steps': 2325, 'loss/train': 2.688612222671509} +11/06/2021 21:35:48 - INFO - __main__ - Step 2327: {'lr': 0.0004999940142331785, 'samples': 446784, 'steps': 2326, 'loss/train': 2.2611327171325684} +11/06/2021 21:35:48 - INFO - __main__ - Step 2328: {'lr': 0.0004999939774545074, 'samples': 446976, 'steps': 2327, 'loss/train': 2.940781593322754} +11/06/2021 21:35:48 - INFO - __main__ - Step 2329: {'lr': 0.000499993940563193, 'samples': 447168, 'steps': 2328, 'loss/train': 1.4350242614746094} +11/06/2021 21:35:49 - INFO - __main__ - Step 2330: {'lr': 0.0004999939035592351, 'samples': 447360, 'steps': 2329, 'loss/train': 1.2856340408325195} +11/06/2021 21:35:49 - INFO - __main__ - Step 2331: {'lr': 0.0004999938664426339, 'samples': 447552, 'steps': 2330, 'loss/train': 2.2000558376312256} +11/06/2021 21:35:50 - INFO - __main__ - Step 2332: {'lr': 0.0004999938292133894, 'samples': 447744, 'steps': 2331, 'loss/train': 2.552149534225464} +11/06/2021 21:35:51 - INFO - __main__ - Step 2333: {'lr': 0.0004999937918715013, 'samples': 447936, 'steps': 2332, 'loss/train': 2.23763370513916} +11/06/2021 21:35:51 - INFO - __main__ - Step 2334: {'lr': 0.00049999375441697, 'samples': 448128, 'steps': 2333, 'loss/train': 2.5193448066711426} +11/06/2021 21:35:51 - INFO - __main__ - Step 2335: {'lr': 0.0004999937168497954, 'samples': 448320, 'steps': 2334, 'loss/train': 2.982269763946533} +11/06/2021 21:35:52 - INFO - __main__ - Step 2336: {'lr': 0.0004999936791699773, 'samples': 448512, 'steps': 2335, 'loss/train': 2.2376298904418945} +11/06/2021 21:35:53 - INFO - __main__ - Step 2337: {'lr': 0.0004999936413775161, 'samples': 448704, 'steps': 2336, 'loss/train': 2.544750928878784} +11/06/2021 21:35:53 - INFO - __main__ - Step 2338: {'lr': 0.0004999936034724115, 'samples': 448896, 'steps': 2337, 'loss/train': 2.562856912612915} +11/06/2021 21:35:53 - INFO - __main__ - Step 2339: {'lr': 0.0004999935654546638, 'samples': 449088, 'steps': 2338, 'loss/train': 2.4741744995117188} +11/06/2021 21:35:54 - INFO - __main__ - Step 2340: {'lr': 0.0004999935273242727, 'samples': 449280, 'steps': 2339, 'loss/train': 2.637646198272705} +11/06/2021 21:35:54 - INFO - __main__ - Step 2341: {'lr': 0.0004999934890812384, 'samples': 449472, 'steps': 2340, 'loss/train': 2.313438892364502} +11/06/2021 21:35:55 - INFO - __main__ - Step 2342: {'lr': 0.0004999934507255609, 'samples': 449664, 'steps': 2341, 'loss/train': 1.6301710605621338} +11/06/2021 21:35:55 - INFO - __main__ - Step 2343: {'lr': 0.0004999934122572403, 'samples': 449856, 'steps': 2342, 'loss/train': 2.490684747695923} +11/06/2021 21:35:56 - INFO - __main__ - Step 2344: {'lr': 0.0004999933736762763, 'samples': 450048, 'steps': 2343, 'loss/train': 2.5411455631256104} +11/06/2021 21:35:56 - INFO - __main__ - Step 2345: {'lr': 0.0004999933349826694, 'samples': 450240, 'steps': 2344, 'loss/train': 2.634213924407959} +11/06/2021 21:35:57 - INFO - __main__ - Step 2346: {'lr': 0.0004999932961764192, 'samples': 450432, 'steps': 2345, 'loss/train': 2.2040252685546875} +11/06/2021 21:35:58 - INFO - __main__ - Step 2347: {'lr': 0.000499993257257526, 'samples': 450624, 'steps': 2346, 'loss/train': 3.1868784427642822} +11/06/2021 21:35:58 - INFO - __main__ - Step 2348: {'lr': 0.0004999932182259897, 'samples': 450816, 'steps': 2347, 'loss/train': 2.624990940093994} +11/06/2021 21:35:58 - INFO - __main__ - Step 2349: {'lr': 0.0004999931790818102, 'samples': 451008, 'steps': 2348, 'loss/train': 2.1832830905914307} +11/06/2021 21:35:59 - INFO - __main__ - Step 2350: {'lr': 0.0004999931398249876, 'samples': 451200, 'steps': 2349, 'loss/train': 1.3503772020339966} +11/06/2021 21:35:59 - INFO - __main__ - Step 2351: {'lr': 0.0004999931004555221, 'samples': 451392, 'steps': 2350, 'loss/train': 2.434903383255005} +11/06/2021 21:36:00 - INFO - __main__ - Step 2352: {'lr': 0.0004999930609734135, 'samples': 451584, 'steps': 2351, 'loss/train': 1.9292891025543213} +11/06/2021 21:36:01 - INFO - __main__ - Step 2353: {'lr': 0.0004999930213786619, 'samples': 451776, 'steps': 2352, 'loss/train': 2.576533555984497} +11/06/2021 21:36:01 - INFO - __main__ - Step 2354: {'lr': 0.0004999929816712672, 'samples': 451968, 'steps': 2353, 'loss/train': 2.6374588012695312} +11/06/2021 21:36:01 - INFO - __main__ - Step 2355: {'lr': 0.0004999929418512296, 'samples': 452160, 'steps': 2354, 'loss/train': 2.645233392715454} +11/06/2021 21:36:02 - INFO - __main__ - Step 2356: {'lr': 0.0004999929019185491, 'samples': 452352, 'steps': 2355, 'loss/train': 2.3898088932037354} +11/06/2021 21:36:02 - INFO - __main__ - Step 2357: {'lr': 0.0004999928618732256, 'samples': 452544, 'steps': 2356, 'loss/train': 2.8378491401672363} +11/06/2021 21:36:03 - INFO - __main__ - Step 2358: {'lr': 0.0004999928217152591, 'samples': 452736, 'steps': 2357, 'loss/train': 2.8093080520629883} +11/06/2021 21:36:03 - INFO - __main__ - Step 2359: {'lr': 0.0004999927814446498, 'samples': 452928, 'steps': 2358, 'loss/train': 2.382434844970703} +11/06/2021 21:36:04 - INFO - __main__ - Step 2360: {'lr': 0.0004999927410613975, 'samples': 453120, 'steps': 2359, 'loss/train': 2.509754180908203} +11/06/2021 21:36:04 - INFO - __main__ - Step 2361: {'lr': 0.0004999927005655024, 'samples': 453312, 'steps': 2360, 'loss/train': 2.2279305458068848} +11/06/2021 21:36:04 - INFO - __main__ - Step 2362: {'lr': 0.0004999926599569644, 'samples': 453504, 'steps': 2361, 'loss/train': 2.2018115520477295} +11/06/2021 21:36:05 - INFO - __main__ - Step 2363: {'lr': 0.0004999926192357836, 'samples': 453696, 'steps': 2362, 'loss/train': 2.667649269104004} +11/06/2021 21:36:06 - INFO - __main__ - Step 2364: {'lr': 0.00049999257840196, 'samples': 453888, 'steps': 2363, 'loss/train': 1.9997769594192505} +11/06/2021 21:36:06 - INFO - __main__ - Step 2365: {'lr': 0.0004999925374554936, 'samples': 454080, 'steps': 2364, 'loss/train': 2.3278563022613525} +11/06/2021 21:36:06 - INFO - __main__ - Step 2366: {'lr': 0.0004999924963963845, 'samples': 454272, 'steps': 2365, 'loss/train': 2.7401719093322754} +11/06/2021 21:36:07 - INFO - __main__ - Step 2367: {'lr': 0.0004999924552246324, 'samples': 454464, 'steps': 2366, 'loss/train': 2.5451650619506836} +11/06/2021 21:36:08 - INFO - __main__ - Step 2368: {'lr': 0.0004999924139402378, 'samples': 454656, 'steps': 2367, 'loss/train': 2.171853542327881} +11/06/2021 21:36:08 - INFO - __main__ - Step 2369: {'lr': 0.0004999923725432004, 'samples': 454848, 'steps': 2368, 'loss/train': 2.3794937133789062} +11/06/2021 21:36:09 - INFO - __main__ - Step 2370: {'lr': 0.0004999923310335202, 'samples': 455040, 'steps': 2369, 'loss/train': 2.2186713218688965} +11/06/2021 21:36:09 - INFO - __main__ - Step 2371: {'lr': 0.0004999922894111975, 'samples': 455232, 'steps': 2370, 'loss/train': 2.5309088230133057} +11/06/2021 21:36:09 - INFO - __main__ - Step 2372: {'lr': 0.000499992247676232, 'samples': 455424, 'steps': 2371, 'loss/train': 2.399653196334839} +11/06/2021 21:36:10 - INFO - __main__ - Step 2373: {'lr': 0.0004999922058286238, 'samples': 455616, 'steps': 2372, 'loss/train': 2.432457208633423} +11/06/2021 21:36:11 - INFO - __main__ - Step 2374: {'lr': 0.0004999921638683731, 'samples': 455808, 'steps': 2373, 'loss/train': 2.936699390411377} +11/06/2021 21:36:11 - INFO - __main__ - Step 2375: {'lr': 0.0004999921217954797, 'samples': 456000, 'steps': 2374, 'loss/train': 2.8602395057678223} +11/06/2021 21:36:11 - INFO - __main__ - Step 2376: {'lr': 0.0004999920796099437, 'samples': 456192, 'steps': 2375, 'loss/train': 2.113866090774536} +11/06/2021 21:36:12 - INFO - __main__ - Step 2377: {'lr': 0.0004999920373117652, 'samples': 456384, 'steps': 2376, 'loss/train': 2.382596492767334} +11/06/2021 21:36:13 - INFO - __main__ - Step 2378: {'lr': 0.0004999919949009442, 'samples': 456576, 'steps': 2377, 'loss/train': 1.9662163257598877} +11/06/2021 21:36:13 - INFO - __main__ - Step 2379: {'lr': 0.0004999919523774806, 'samples': 456768, 'steps': 2378, 'loss/train': 2.765549659729004} +11/06/2021 21:36:13 - INFO - __main__ - Step 2380: {'lr': 0.0004999919097413743, 'samples': 456960, 'steps': 2379, 'loss/train': 2.0128252506256104} +11/06/2021 21:36:14 - INFO - __main__ - Step 2381: {'lr': 0.0004999918669926258, 'samples': 457152, 'steps': 2380, 'loss/train': 2.4427826404571533} +11/06/2021 21:36:14 - INFO - __main__ - Step 2382: {'lr': 0.0004999918241312346, 'samples': 457344, 'steps': 2381, 'loss/train': 3.2769882678985596} +11/06/2021 21:36:15 - INFO - __main__ - Step 2383: {'lr': 0.0004999917811572011, 'samples': 457536, 'steps': 2382, 'loss/train': 2.264770030975342} +11/06/2021 21:36:16 - INFO - __main__ - Step 2384: {'lr': 0.000499991738070525, 'samples': 457728, 'steps': 2383, 'loss/train': 2.820688247680664} +11/06/2021 21:36:16 - INFO - __main__ - Step 2385: {'lr': 0.0004999916948712066, 'samples': 457920, 'steps': 2384, 'loss/train': 2.739671230316162} +11/06/2021 21:36:16 - INFO - __main__ - Step 2386: {'lr': 0.0004999916515592458, 'samples': 458112, 'steps': 2385, 'loss/train': 2.355753183364868} +11/06/2021 21:36:17 - INFO - __main__ - Step 2387: {'lr': 0.0004999916081346426, 'samples': 458304, 'steps': 2386, 'loss/train': 2.6739003658294678} +11/06/2021 21:36:17 - INFO - __main__ - Step 2388: {'lr': 0.000499991564597397, 'samples': 458496, 'steps': 2387, 'loss/train': 2.985884189605713} +11/06/2021 21:36:18 - INFO - __main__ - Step 2389: {'lr': 0.0004999915209475091, 'samples': 458688, 'steps': 2388, 'loss/train': 2.5510177612304688} +11/06/2021 21:36:18 - INFO - __main__ - Step 2390: {'lr': 0.0004999914771849788, 'samples': 458880, 'steps': 2389, 'loss/train': 2.628279447555542} +11/06/2021 21:36:19 - INFO - __main__ - Step 2391: {'lr': 0.0004999914333098063, 'samples': 459072, 'steps': 2390, 'loss/train': 2.3192155361175537} +11/06/2021 21:36:19 - INFO - __main__ - Step 2392: {'lr': 0.0004999913893219915, 'samples': 459264, 'steps': 2391, 'loss/train': 2.4803824424743652} +11/06/2021 21:36:19 - INFO - __main__ - Step 2393: {'lr': 0.0004999913452215345, 'samples': 459456, 'steps': 2392, 'loss/train': 2.0477797985076904} +11/06/2021 21:36:20 - INFO - __main__ - Step 2394: {'lr': 0.0004999913010084351, 'samples': 459648, 'steps': 2393, 'loss/train': 2.529292583465576} +11/06/2021 21:36:21 - INFO - __main__ - Step 2395: {'lr': 0.0004999912566826935, 'samples': 459840, 'steps': 2394, 'loss/train': 2.484360456466675} +11/06/2021 21:36:21 - INFO - __main__ - Step 2396: {'lr': 0.0004999912122443098, 'samples': 460032, 'steps': 2395, 'loss/train': 2.425950288772583} +11/06/2021 21:36:22 - INFO - __main__ - Step 2397: {'lr': 0.0004999911676932838, 'samples': 460224, 'steps': 2396, 'loss/train': 2.7710964679718018} +11/06/2021 21:36:22 - INFO - __main__ - Step 2398: {'lr': 0.0004999911230296158, 'samples': 460416, 'steps': 2397, 'loss/train': 2.69278883934021} +11/06/2021 21:36:23 - INFO - __main__ - Step 2399: {'lr': 0.0004999910782533055, 'samples': 460608, 'steps': 2398, 'loss/train': 2.1563870906829834} +11/06/2021 21:36:23 - INFO - __main__ - Step 2400: {'lr': 0.0004999910333643531, 'samples': 460800, 'steps': 2399, 'loss/train': 2.21958327293396} +11/06/2021 21:36:24 - INFO - __main__ - Step 2401: {'lr': 0.0004999909883627587, 'samples': 460992, 'steps': 2400, 'loss/train': 2.3043596744537354} +11/06/2021 21:36:24 - INFO - __main__ - Step 2402: {'lr': 0.0004999909432485221, 'samples': 461184, 'steps': 2401, 'loss/train': 2.142707586288452} +11/06/2021 21:36:24 - INFO - __main__ - Step 2403: {'lr': 0.0004999908980216436, 'samples': 461376, 'steps': 2402, 'loss/train': 2.6707916259765625} +11/06/2021 21:36:25 - INFO - __main__ - Step 2404: {'lr': 0.0004999908526821229, 'samples': 461568, 'steps': 2403, 'loss/train': 2.7008554935455322} +11/06/2021 21:36:26 - INFO - __main__ - Step 2405: {'lr': 0.0004999908072299602, 'samples': 461760, 'steps': 2404, 'loss/train': 2.4561195373535156} +11/06/2021 21:36:26 - INFO - __main__ - Step 2406: {'lr': 0.0004999907616651556, 'samples': 461952, 'steps': 2405, 'loss/train': 2.6300549507141113} +11/06/2021 21:36:26 - INFO - __main__ - Step 2407: {'lr': 0.000499990715987709, 'samples': 462144, 'steps': 2406, 'loss/train': 2.5278778076171875} +11/06/2021 21:36:27 - INFO - __main__ - Step 2408: {'lr': 0.0004999906701976203, 'samples': 462336, 'steps': 2407, 'loss/train': 2.5817818641662598} +11/06/2021 21:36:28 - INFO - __main__ - Step 2409: {'lr': 0.0004999906242948898, 'samples': 462528, 'steps': 2408, 'loss/train': 2.7424280643463135} +11/06/2021 21:36:28 - INFO - __main__ - Step 2410: {'lr': 0.0004999905782795173, 'samples': 462720, 'steps': 2409, 'loss/train': 2.3306918144226074} +11/06/2021 21:36:29 - INFO - __main__ - Step 2411: {'lr': 0.000499990532151503, 'samples': 462912, 'steps': 2410, 'loss/train': 2.3240315914154053} +11/06/2021 21:36:29 - INFO - __main__ - Step 2412: {'lr': 0.0004999904859108467, 'samples': 463104, 'steps': 2411, 'loss/train': 2.3780782222747803} +11/06/2021 21:36:29 - INFO - __main__ - Step 2413: {'lr': 0.0004999904395575486, 'samples': 463296, 'steps': 2412, 'loss/train': 2.3109028339385986} +11/06/2021 21:36:30 - INFO - __main__ - Step 2414: {'lr': 0.0004999903930916087, 'samples': 463488, 'steps': 2413, 'loss/train': 2.878998279571533} +11/06/2021 21:36:31 - INFO - __main__ - Step 2415: {'lr': 0.000499990346513027, 'samples': 463680, 'steps': 2414, 'loss/train': 2.0418524742126465} +11/06/2021 21:36:31 - INFO - __main__ - Step 2416: {'lr': 0.0004999902998218034, 'samples': 463872, 'steps': 2415, 'loss/train': 2.2002334594726562} +11/06/2021 21:36:31 - INFO - __main__ - Step 2417: {'lr': 0.000499990253017938, 'samples': 464064, 'steps': 2416, 'loss/train': 2.537015438079834} +11/06/2021 21:36:32 - INFO - __main__ - Step 2418: {'lr': 0.0004999902061014311, 'samples': 464256, 'steps': 2417, 'loss/train': 2.3986918926239014} +11/06/2021 21:36:32 - INFO - __main__ - Step 2419: {'lr': 0.0004999901590722823, 'samples': 464448, 'steps': 2418, 'loss/train': 2.3698606491088867} +11/06/2021 21:36:33 - INFO - __main__ - Step 2420: {'lr': 0.0004999901119304919, 'samples': 464640, 'steps': 2419, 'loss/train': 2.4910922050476074} +11/06/2021 21:36:33 - INFO - __main__ - Step 2421: {'lr': 0.0004999900646760597, 'samples': 464832, 'steps': 2420, 'loss/train': 2.2482521533966064} +11/06/2021 21:36:34 - INFO - __main__ - Step 2422: {'lr': 0.0004999900173089858, 'samples': 465024, 'steps': 2421, 'loss/train': 3.0635385513305664} +11/06/2021 21:36:34 - INFO - __main__ - Step 2423: {'lr': 0.0004999899698292703, 'samples': 465216, 'steps': 2422, 'loss/train': 2.6223621368408203} +11/06/2021 21:36:35 - INFO - __main__ - Step 2424: {'lr': 0.0004999899222369132, 'samples': 465408, 'steps': 2423, 'loss/train': 2.0457282066345215} +11/06/2021 21:36:35 - INFO - __main__ - Step 2425: {'lr': 0.0004999898745319145, 'samples': 465600, 'steps': 2424, 'loss/train': 2.419081449508667} +11/06/2021 21:36:36 - INFO - __main__ - Step 2426: {'lr': 0.0004999898267142741, 'samples': 465792, 'steps': 2425, 'loss/train': 2.6468558311462402} +11/06/2021 21:36:36 - INFO - __main__ - Step 2427: {'lr': 0.0004999897787839923, 'samples': 465984, 'steps': 2426, 'loss/train': 2.8656837940216064} +11/06/2021 21:36:37 - INFO - __main__ - Step 2428: {'lr': 0.000499989730741069, 'samples': 466176, 'steps': 2427, 'loss/train': 2.517319679260254} +11/06/2021 21:36:37 - INFO - __main__ - Step 2429: {'lr': 0.000499989682585504, 'samples': 466368, 'steps': 2428, 'loss/train': 1.5299700498580933} +11/06/2021 21:36:37 - INFO - __main__ - Step 2430: {'lr': 0.0004999896343172976, 'samples': 466560, 'steps': 2429, 'loss/train': 1.4747153520584106} +11/06/2021 21:36:38 - INFO - __main__ - Step 2431: {'lr': 0.0004999895859364498, 'samples': 466752, 'steps': 2430, 'loss/train': 1.975550651550293} +11/06/2021 21:36:39 - INFO - __main__ - Step 2432: {'lr': 0.0004999895374429605, 'samples': 466944, 'steps': 2431, 'loss/train': 2.7396199703216553} +11/06/2021 21:36:39 - INFO - __main__ - Step 2433: {'lr': 0.0004999894888368297, 'samples': 467136, 'steps': 2432, 'loss/train': 2.1605048179626465} +11/06/2021 21:36:39 - INFO - __main__ - Step 2434: {'lr': 0.0004999894401180576, 'samples': 467328, 'steps': 2433, 'loss/train': 2.631399631500244} +11/06/2021 21:36:40 - INFO - __main__ - Step 2435: {'lr': 0.0004999893912866441, 'samples': 467520, 'steps': 2434, 'loss/train': 2.6873080730438232} +11/06/2021 21:36:41 - INFO - __main__ - Step 2436: {'lr': 0.0004999893423425892, 'samples': 467712, 'steps': 2435, 'loss/train': 2.2480852603912354} +11/06/2021 21:36:41 - INFO - __main__ - Step 2437: {'lr': 0.0004999892932858929, 'samples': 467904, 'steps': 2436, 'loss/train': 2.1071290969848633} +11/06/2021 21:36:42 - INFO - __main__ - Step 2438: {'lr': 0.0004999892441165554, 'samples': 468096, 'steps': 2437, 'loss/train': 2.8640754222869873} +11/06/2021 21:36:42 - INFO - __main__ - Step 2439: {'lr': 0.0004999891948345765, 'samples': 468288, 'steps': 2438, 'loss/train': 2.4221558570861816} +11/06/2021 21:36:42 - INFO - __main__ - Step 2440: {'lr': 0.0004999891454399565, 'samples': 468480, 'steps': 2439, 'loss/train': 2.7163968086242676} +11/06/2021 21:36:43 - INFO - __main__ - Step 2441: {'lr': 0.000499989095932695, 'samples': 468672, 'steps': 2440, 'loss/train': 2.371148109436035} +11/06/2021 21:36:44 - INFO - __main__ - Step 2442: {'lr': 0.0004999890463127924, 'samples': 468864, 'steps': 2441, 'loss/train': 2.5758795738220215} +11/06/2021 21:36:44 - INFO - __main__ - Step 2443: {'lr': 0.0004999889965802486, 'samples': 469056, 'steps': 2442, 'loss/train': 2.778921127319336} +11/06/2021 21:36:44 - INFO - __main__ - Step 2444: {'lr': 0.0004999889467350636, 'samples': 469248, 'steps': 2443, 'loss/train': 1.8492902517318726} +11/06/2021 21:36:45 - INFO - __main__ - Step 2445: {'lr': 0.0004999888967772375, 'samples': 469440, 'steps': 2444, 'loss/train': 2.191366672515869} +11/06/2021 21:36:45 - INFO - __main__ - Step 2446: {'lr': 0.0004999888467067702, 'samples': 469632, 'steps': 2445, 'loss/train': 2.458528757095337} +11/06/2021 21:36:46 - INFO - __main__ - Step 2447: {'lr': 0.0004999887965236617, 'samples': 469824, 'steps': 2446, 'loss/train': 2.605138063430786} +11/06/2021 21:36:46 - INFO - __main__ - Step 2448: {'lr': 0.0004999887462279123, 'samples': 470016, 'steps': 2447, 'loss/train': 2.1305642127990723} +11/06/2021 21:36:47 - INFO - __main__ - Step 2449: {'lr': 0.0004999886958195216, 'samples': 470208, 'steps': 2448, 'loss/train': 2.6707427501678467} +11/06/2021 21:36:47 - INFO - __main__ - Step 2450: {'lr': 0.00049998864529849, 'samples': 470400, 'steps': 2449, 'loss/train': 1.814773440361023} +11/06/2021 21:36:47 - INFO - __main__ - Step 2451: {'lr': 0.0004999885946648174, 'samples': 470592, 'steps': 2450, 'loss/train': 2.4460277557373047} +11/06/2021 21:36:48 - INFO - __main__ - Step 2452: {'lr': 0.0004999885439185037, 'samples': 470784, 'steps': 2451, 'loss/train': 2.429396390914917} +11/06/2021 21:36:49 - INFO - __main__ - Step 2453: {'lr': 0.0004999884930595491, 'samples': 470976, 'steps': 2452, 'loss/train': 2.094714879989624} +11/06/2021 21:36:49 - INFO - __main__ - Step 2454: {'lr': 0.0004999884420879534, 'samples': 471168, 'steps': 2453, 'loss/train': 2.2643680572509766} +11/06/2021 21:36:49 - INFO - __main__ - Step 2455: {'lr': 0.000499988391003717, 'samples': 471360, 'steps': 2454, 'loss/train': 2.5920233726501465} +11/06/2021 21:36:50 - INFO - __main__ - Step 2456: {'lr': 0.0004999883398068396, 'samples': 471552, 'steps': 2455, 'loss/train': 3.2174901962280273} +11/06/2021 21:36:51 - INFO - __main__ - Step 2457: {'lr': 0.0004999882884973212, 'samples': 471744, 'steps': 2456, 'loss/train': 2.311598062515259} +11/06/2021 21:36:52 - INFO - __main__ - Step 2458: {'lr': 0.000499988237075162, 'samples': 471936, 'steps': 2457, 'loss/train': 2.8705482482910156} +11/06/2021 21:36:52 - INFO - __main__ - Step 2459: {'lr': 0.000499988185540362, 'samples': 472128, 'steps': 2458, 'loss/train': 3.6789543628692627} +11/06/2021 21:36:52 - INFO - __main__ - Step 2460: {'lr': 0.0004999881338929211, 'samples': 472320, 'steps': 2459, 'loss/train': 2.2293074131011963} +11/06/2021 21:36:53 - INFO - __main__ - Step 2461: {'lr': 0.0004999880821328395, 'samples': 472512, 'steps': 2460, 'loss/train': 2.13460373878479} +11/06/2021 21:36:53 - INFO - __main__ - Step 2462: {'lr': 0.000499988030260117, 'samples': 472704, 'steps': 2461, 'loss/train': 2.2145402431488037} +11/06/2021 21:36:54 - INFO - __main__ - Step 2463: {'lr': 0.0004999879782747539, 'samples': 472896, 'steps': 2462, 'loss/train': 2.412808418273926} +11/06/2021 21:36:55 - INFO - __main__ - Step 2464: {'lr': 0.00049998792617675, 'samples': 473088, 'steps': 2463, 'loss/train': 1.355026125907898} +11/06/2021 21:36:55 - INFO - __main__ - Step 2465: {'lr': 0.0004999878739661053, 'samples': 473280, 'steps': 2464, 'loss/train': 2.797194242477417} +11/06/2021 21:36:55 - INFO - __main__ - Step 2466: {'lr': 0.0004999878216428201, 'samples': 473472, 'steps': 2465, 'loss/train': 3.099053144454956} +11/06/2021 21:36:56 - INFO - __main__ - Step 2467: {'lr': 0.0004999877692068942, 'samples': 473664, 'steps': 2466, 'loss/train': 2.666736602783203} +11/06/2021 21:36:57 - INFO - __main__ - Step 2468: {'lr': 0.0004999877166583276, 'samples': 473856, 'steps': 2467, 'loss/train': 2.2007715702056885} +11/06/2021 21:36:57 - INFO - __main__ - Step 2469: {'lr': 0.0004999876639971204, 'samples': 474048, 'steps': 2468, 'loss/train': 2.5760223865509033} +11/06/2021 21:36:57 - INFO - __main__ - Step 2470: {'lr': 0.0004999876112232726, 'samples': 474240, 'steps': 2469, 'loss/train': 2.2806897163391113} +11/06/2021 21:36:58 - INFO - __main__ - Step 2471: {'lr': 0.0004999875583367844, 'samples': 474432, 'steps': 2470, 'loss/train': 2.3899688720703125} +11/06/2021 21:36:58 - INFO - __main__ - Step 2472: {'lr': 0.0004999875053376555, 'samples': 474624, 'steps': 2471, 'loss/train': 2.720411539077759} +11/06/2021 21:36:59 - INFO - __main__ - Step 2473: {'lr': 0.0004999874522258861, 'samples': 474816, 'steps': 2472, 'loss/train': 2.3538568019866943} +11/06/2021 21:36:59 - INFO - __main__ - Step 2474: {'lr': 0.0004999873990014763, 'samples': 475008, 'steps': 2473, 'loss/train': 2.296961784362793} +11/06/2021 21:37:00 - INFO - __main__ - Step 2475: {'lr': 0.0004999873456644259, 'samples': 475200, 'steps': 2474, 'loss/train': 3.126654624938965} +11/06/2021 21:37:00 - INFO - __main__ - Step 2476: {'lr': 0.0004999872922147352, 'samples': 475392, 'steps': 2475, 'loss/train': 2.8180599212646484} +11/06/2021 21:37:01 - INFO - __main__ - Step 2477: {'lr': 0.0004999872386524041, 'samples': 475584, 'steps': 2476, 'loss/train': 2.209730625152588} +11/06/2021 21:37:02 - INFO - __main__ - Step 2478: {'lr': 0.0004999871849774325, 'samples': 475776, 'steps': 2477, 'loss/train': 2.773592472076416} +11/06/2021 21:37:02 - INFO - __main__ - Step 2479: {'lr': 0.0004999871311898205, 'samples': 475968, 'steps': 2478, 'loss/train': 2.503931760787964} +11/06/2021 21:37:02 - INFO - __main__ - Step 2480: {'lr': 0.0004999870772895683, 'samples': 476160, 'steps': 2479, 'loss/train': 2.848806858062744} +11/06/2021 21:37:03 - INFO - __main__ - Step 2481: {'lr': 0.0004999870232766756, 'samples': 476352, 'steps': 2480, 'loss/train': 2.6014020442962646} +11/06/2021 21:37:03 - INFO - __main__ - Step 2482: {'lr': 0.0004999869691511428, 'samples': 476544, 'steps': 2481, 'loss/train': 2.4127416610717773} +11/06/2021 21:37:04 - INFO - __main__ - Step 2483: {'lr': 0.0004999869149129696, 'samples': 476736, 'steps': 2482, 'loss/train': 1.9022128582000732} +11/06/2021 21:37:04 - INFO - __main__ - Step 2484: {'lr': 0.0004999868605621563, 'samples': 476928, 'steps': 2483, 'loss/train': 2.502490282058716} +11/06/2021 21:37:05 - INFO - __main__ - Step 2485: {'lr': 0.0004999868060987027, 'samples': 477120, 'steps': 2484, 'loss/train': 2.5162899494171143} +11/06/2021 21:37:05 - INFO - __main__ - Step 2486: {'lr': 0.0004999867515226088, 'samples': 477312, 'steps': 2485, 'loss/train': 2.565920829772949} +11/06/2021 21:37:05 - INFO - __main__ - Step 2487: {'lr': 0.0004999866968338748, 'samples': 477504, 'steps': 2486, 'loss/train': 2.152040481567383} +11/06/2021 21:37:07 - INFO - __main__ - Step 2488: {'lr': 0.0004999866420325006, 'samples': 477696, 'steps': 2487, 'loss/train': 2.5506532192230225} +11/06/2021 21:37:07 - INFO - __main__ - Step 2489: {'lr': 0.0004999865871184863, 'samples': 477888, 'steps': 2488, 'loss/train': 2.6349217891693115} +11/06/2021 21:37:07 - INFO - __main__ - Step 2490: {'lr': 0.000499986532091832, 'samples': 478080, 'steps': 2489, 'loss/train': 1.8564928770065308} +11/06/2021 21:37:08 - INFO - __main__ - Step 2491: {'lr': 0.0004999864769525375, 'samples': 478272, 'steps': 2490, 'loss/train': 2.035461664199829} +11/06/2021 21:37:08 - INFO - __main__ - Step 2492: {'lr': 0.000499986421700603, 'samples': 478464, 'steps': 2491, 'loss/train': 2.712242364883423} +11/06/2021 21:37:09 - INFO - __main__ - Step 2493: {'lr': 0.0004999863663360285, 'samples': 478656, 'steps': 2492, 'loss/train': 1.668128490447998} +11/06/2021 21:37:09 - INFO - __main__ - Step 2494: {'lr': 0.000499986310858814, 'samples': 478848, 'steps': 2493, 'loss/train': 2.30643892288208} +11/06/2021 21:37:10 - INFO - __main__ - Step 2495: {'lr': 0.0004999862552689595, 'samples': 479040, 'steps': 2494, 'loss/train': 2.329277992248535} +11/06/2021 21:37:10 - INFO - __main__ - Step 2496: {'lr': 0.000499986199566465, 'samples': 479232, 'steps': 2495, 'loss/train': 2.888967275619507} +11/06/2021 21:37:10 - INFO - __main__ - Step 2497: {'lr': 0.0004999861437513306, 'samples': 479424, 'steps': 2496, 'loss/train': 2.5283238887786865} +11/06/2021 21:37:11 - INFO - __main__ - Step 2498: {'lr': 0.0004999860878235564, 'samples': 479616, 'steps': 2497, 'loss/train': 2.4118523597717285} +11/06/2021 21:37:12 - INFO - __main__ - Step 2499: {'lr': 0.0004999860317831423, 'samples': 479808, 'steps': 2498, 'loss/train': 1.975379228591919} +11/06/2021 21:37:12 - INFO - __main__ - Step 2500: {'lr': 0.0004999859756300883, 'samples': 480000, 'steps': 2499, 'loss/train': 2.776916027069092} +11/06/2021 21:37:13 - INFO - __main__ - Step 2501: {'lr': 0.0004999859193643945, 'samples': 480192, 'steps': 2500, 'loss/train': 1.9438010454177856} +11/06/2021 21:37:13 - INFO - __main__ - Step 2502: {'lr': 0.0004999858629860609, 'samples': 480384, 'steps': 2501, 'loss/train': 2.3400754928588867} +11/06/2021 21:37:14 - INFO - __main__ - Step 2503: {'lr': 0.0004999858064950875, 'samples': 480576, 'steps': 2502, 'loss/train': 2.453505516052246} +11/06/2021 21:37:14 - INFO - __main__ - Step 2504: {'lr': 0.0004999857498914744, 'samples': 480768, 'steps': 2503, 'loss/train': 1.737013339996338} +11/06/2021 21:37:15 - INFO - __main__ - Step 2505: {'lr': 0.0004999856931752215, 'samples': 480960, 'steps': 2504, 'loss/train': 2.44512677192688} +11/06/2021 21:37:15 - INFO - __main__ - Step 2506: {'lr': 0.000499985636346329, 'samples': 481152, 'steps': 2505, 'loss/train': 2.2163236141204834} +11/06/2021 21:37:15 - INFO - __main__ - Step 2507: {'lr': 0.0004999855794047968, 'samples': 481344, 'steps': 2506, 'loss/train': 2.2586050033569336} +11/06/2021 21:37:16 - INFO - __main__ - Step 2508: {'lr': 0.000499985522350625, 'samples': 481536, 'steps': 2507, 'loss/train': 2.6702263355255127} +11/06/2021 21:37:17 - INFO - __main__ - Step 2509: {'lr': 0.0004999854651838134, 'samples': 481728, 'steps': 2508, 'loss/train': 1.7556337118148804} +11/06/2021 21:37:17 - INFO - __main__ - Step 2510: {'lr': 0.0004999854079043624, 'samples': 481920, 'steps': 2509, 'loss/train': 2.5938799381256104} +11/06/2021 21:37:17 - INFO - __main__ - Step 2511: {'lr': 0.0004999853505122718, 'samples': 482112, 'steps': 2510, 'loss/train': 2.314603567123413} +11/06/2021 21:37:18 - INFO - __main__ - Step 2512: {'lr': 0.0004999852930075416, 'samples': 482304, 'steps': 2511, 'loss/train': 3.3958892822265625} +11/06/2021 21:37:18 - INFO - __main__ - Step 2513: {'lr': 0.0004999852353901719, 'samples': 482496, 'steps': 2512, 'loss/train': 2.0846526622772217} +11/06/2021 21:37:19 - INFO - __main__ - Step 2514: {'lr': 0.0004999851776601627, 'samples': 482688, 'steps': 2513, 'loss/train': 2.1145737171173096} +11/06/2021 21:37:19 - INFO - __main__ - Step 2515: {'lr': 0.0004999851198175141, 'samples': 482880, 'steps': 2514, 'loss/train': 2.3666229248046875} +11/06/2021 21:37:20 - INFO - __main__ - Step 2516: {'lr': 0.0004999850618622259, 'samples': 483072, 'steps': 2515, 'loss/train': 1.9783778190612793} +11/06/2021 21:37:20 - INFO - __main__ - Step 2517: {'lr': 0.0004999850037942984, 'samples': 483264, 'steps': 2516, 'loss/train': 1.6819298267364502} +11/06/2021 21:37:21 - INFO - __main__ - Step 2518: {'lr': 0.0004999849456137316, 'samples': 483456, 'steps': 2517, 'loss/train': 2.5427420139312744} +11/06/2021 21:37:22 - INFO - __main__ - Step 2519: {'lr': 0.0004999848873205254, 'samples': 483648, 'steps': 2518, 'loss/train': 1.944232702255249} +11/06/2021 21:37:22 - INFO - __main__ - Step 2520: {'lr': 0.0004999848289146798, 'samples': 483840, 'steps': 2519, 'loss/train': 2.538642644882202} +11/06/2021 21:37:22 - INFO - __main__ - Step 2521: {'lr': 0.0004999847703961948, 'samples': 484032, 'steps': 2520, 'loss/train': 2.035733699798584} +11/06/2021 21:37:23 - INFO - __main__ - Step 2522: {'lr': 0.0004999847117650708, 'samples': 484224, 'steps': 2521, 'loss/train': 2.2497646808624268} +11/06/2021 21:37:23 - INFO - __main__ - Step 2523: {'lr': 0.0004999846530213074, 'samples': 484416, 'steps': 2522, 'loss/train': 2.4687421321868896} +11/06/2021 21:37:24 - INFO - __main__ - Step 2524: {'lr': 0.0004999845941649048, 'samples': 484608, 'steps': 2523, 'loss/train': 2.6273131370544434} +11/06/2021 21:37:25 - INFO - __main__ - Step 2525: {'lr': 0.0004999845351958629, 'samples': 484800, 'steps': 2524, 'loss/train': 2.2162749767303467} +11/06/2021 21:37:25 - INFO - __main__ - Step 2526: {'lr': 0.0004999844761141818, 'samples': 484992, 'steps': 2525, 'loss/train': 2.4674794673919678} +11/06/2021 21:37:25 - INFO - __main__ - Step 2527: {'lr': 0.0004999844169198617, 'samples': 485184, 'steps': 2526, 'loss/train': 2.444234609603882} +11/06/2021 21:37:26 - INFO - __main__ - Step 2528: {'lr': 0.0004999843576129024, 'samples': 485376, 'steps': 2527, 'loss/train': 2.046820640563965} +11/06/2021 21:37:27 - INFO - __main__ - Step 2529: {'lr': 0.000499984298193304, 'samples': 485568, 'steps': 2528, 'loss/train': 3.3430094718933105} +11/06/2021 21:37:27 - INFO - __main__ - Step 2530: {'lr': 0.0004999842386610666, 'samples': 485760, 'steps': 2529, 'loss/train': 2.4798810482025146} +11/06/2021 21:37:27 - INFO - __main__ - Step 2531: {'lr': 0.0004999841790161901, 'samples': 485952, 'steps': 2530, 'loss/train': 2.1105799674987793} +11/06/2021 21:37:28 - INFO - __main__ - Step 2532: {'lr': 0.0004999841192586746, 'samples': 486144, 'steps': 2531, 'loss/train': 2.247392177581787} +11/06/2021 21:37:28 - INFO - __main__ - Step 2533: {'lr': 0.0004999840593885201, 'samples': 486336, 'steps': 2532, 'loss/train': 2.632009983062744} +11/06/2021 21:37:29 - INFO - __main__ - Step 2534: {'lr': 0.0004999839994057266, 'samples': 486528, 'steps': 2533, 'loss/train': 2.2957653999328613} +11/06/2021 21:37:29 - INFO - __main__ - Step 2535: {'lr': 0.0004999839393102943, 'samples': 486720, 'steps': 2534, 'loss/train': 2.15610671043396} +11/06/2021 21:37:30 - INFO - __main__ - Step 2536: {'lr': 0.0004999838791022229, 'samples': 486912, 'steps': 2535, 'loss/train': 1.8324062824249268} +11/06/2021 21:37:30 - INFO - __main__ - Step 2537: {'lr': 0.0004999838187815128, 'samples': 487104, 'steps': 2536, 'loss/train': 2.1403756141662598} +11/06/2021 21:37:30 - INFO - __main__ - Step 2538: {'lr': 0.0004999837583481638, 'samples': 487296, 'steps': 2537, 'loss/train': 2.4630844593048096} +11/06/2021 21:37:31 - INFO - __main__ - Step 2539: {'lr': 0.000499983697802176, 'samples': 487488, 'steps': 2538, 'loss/train': 2.763502836227417} +11/06/2021 21:37:32 - INFO - __main__ - Step 2540: {'lr': 0.0004999836371435494, 'samples': 487680, 'steps': 2539, 'loss/train': 1.6404800415039062} +11/06/2021 21:37:32 - INFO - __main__ - Step 2541: {'lr': 0.000499983576372284, 'samples': 487872, 'steps': 2540, 'loss/train': 0.7703345417976379} +11/06/2021 21:37:32 - INFO - __main__ - Step 2542: {'lr': 0.0004999835154883798, 'samples': 488064, 'steps': 2541, 'loss/train': 2.3808321952819824} +11/06/2021 21:37:33 - INFO - __main__ - Step 2543: {'lr': 0.0004999834544918369, 'samples': 488256, 'steps': 2542, 'loss/train': 1.3541216850280762} +11/06/2021 21:37:33 - INFO - __main__ - Step 2544: {'lr': 0.0004999833933826554, 'samples': 488448, 'steps': 2543, 'loss/train': 2.6432573795318604} +11/06/2021 21:37:34 - INFO - __main__ - Step 2545: {'lr': 0.0004999833321608351, 'samples': 488640, 'steps': 2544, 'loss/train': 2.655363082885742} +11/06/2021 21:37:35 - INFO - __main__ - Step 2546: {'lr': 0.0004999832708263764, 'samples': 488832, 'steps': 2545, 'loss/train': 1.829182744026184} +11/06/2021 21:37:35 - INFO - __main__ - Step 2547: {'lr': 0.000499983209379279, 'samples': 489024, 'steps': 2546, 'loss/train': 2.714189291000366} +11/06/2021 21:37:35 - INFO - __main__ - Step 2548: {'lr': 0.0004999831478195429, 'samples': 489216, 'steps': 2547, 'loss/train': 2.1510307788848877} +11/06/2021 21:37:36 - INFO - __main__ - Step 2549: {'lr': 0.0004999830861471684, 'samples': 489408, 'steps': 2548, 'loss/train': 2.5913808345794678} +11/06/2021 21:37:37 - INFO - __main__ - Step 2550: {'lr': 0.0004999830243621553, 'samples': 489600, 'steps': 2549, 'loss/train': 2.1029839515686035} +11/06/2021 21:37:37 - INFO - __main__ - Step 2551: {'lr': 0.0004999829624645037, 'samples': 489792, 'steps': 2550, 'loss/train': 2.4384331703186035} +11/06/2021 21:37:37 - INFO - __main__ - Step 2552: {'lr': 0.0004999829004542136, 'samples': 489984, 'steps': 2551, 'loss/train': 2.5452609062194824} +11/06/2021 21:37:38 - INFO - __main__ - Step 2553: {'lr': 0.0004999828383312851, 'samples': 490176, 'steps': 2552, 'loss/train': 2.293485403060913} +11/06/2021 21:37:38 - INFO - __main__ - Step 2554: {'lr': 0.0004999827760957182, 'samples': 490368, 'steps': 2553, 'loss/train': 2.1594653129577637} +11/06/2021 21:37:39 - INFO - __main__ - Step 2555: {'lr': 0.000499982713747513, 'samples': 490560, 'steps': 2554, 'loss/train': 2.2348339557647705} +11/06/2021 21:37:39 - INFO - __main__ - Step 2556: {'lr': 0.0004999826512866693, 'samples': 490752, 'steps': 2555, 'loss/train': 2.039029598236084} +11/06/2021 21:37:40 - INFO - __main__ - Step 2557: {'lr': 0.0004999825887131874, 'samples': 490944, 'steps': 2556, 'loss/train': 2.3221940994262695} +11/06/2021 21:37:40 - INFO - __main__ - Step 2558: {'lr': 0.0004999825260270671, 'samples': 491136, 'steps': 2557, 'loss/train': 1.9088735580444336} +11/06/2021 21:37:40 - INFO - __main__ - Step 2559: {'lr': 0.0004999824632283086, 'samples': 491328, 'steps': 2558, 'loss/train': 2.34741473197937} +11/06/2021 21:37:41 - INFO - __main__ - Step 2560: {'lr': 0.0004999824003169119, 'samples': 491520, 'steps': 2559, 'loss/train': 2.832210063934326} +11/06/2021 21:37:42 - INFO - __main__ - Step 2561: {'lr': 0.000499982337292877, 'samples': 491712, 'steps': 2560, 'loss/train': 2.518115758895874} +11/06/2021 21:37:42 - INFO - __main__ - Step 2562: {'lr': 0.0004999822741562038, 'samples': 491904, 'steps': 2561, 'loss/train': 1.5568736791610718} +11/06/2021 21:37:42 - INFO - __main__ - Step 2563: {'lr': 0.0004999822109068925, 'samples': 492096, 'steps': 2562, 'loss/train': 2.128868818283081} +11/06/2021 21:37:43 - INFO - __main__ - Step 2564: {'lr': 0.000499982147544943, 'samples': 492288, 'steps': 2563, 'loss/train': 2.274667739868164} +11/06/2021 21:37:44 - INFO - __main__ - Step 2565: {'lr': 0.0004999820840703554, 'samples': 492480, 'steps': 2564, 'loss/train': 2.438570022583008} +11/06/2021 21:37:44 - INFO - __main__ - Step 2566: {'lr': 0.0004999820204831298, 'samples': 492672, 'steps': 2565, 'loss/train': 1.8974850177764893} +11/06/2021 21:37:44 - INFO - __main__ - Step 2567: {'lr': 0.0004999819567832661, 'samples': 492864, 'steps': 2566, 'loss/train': 1.991250991821289} +11/06/2021 21:37:45 - INFO - __main__ - Step 2568: {'lr': 0.0004999818929707645, 'samples': 493056, 'steps': 2567, 'loss/train': 2.29544734954834} +11/06/2021 21:37:45 - INFO - __main__ - Step 2569: {'lr': 0.0004999818290456249, 'samples': 493248, 'steps': 2568, 'loss/train': 2.5977227687835693} +11/06/2021 21:37:45 - INFO - __main__ - Step 2570: {'lr': 0.0004999817650078474, 'samples': 493440, 'steps': 2569, 'loss/train': 2.2066221237182617} +11/06/2021 21:37:47 - INFO - __main__ - Step 2571: {'lr': 0.0004999817008574318, 'samples': 493632, 'steps': 2570, 'loss/train': 2.1649460792541504} +11/06/2021 21:37:47 - INFO - __main__ - Step 2572: {'lr': 0.0004999816365943784, 'samples': 493824, 'steps': 2571, 'loss/train': 2.5640785694122314} +11/06/2021 21:37:47 - INFO - __main__ - Step 2573: {'lr': 0.000499981572218687, 'samples': 494016, 'steps': 2572, 'loss/train': 2.131150007247925} +11/06/2021 21:37:48 - INFO - __main__ - Step 2574: {'lr': 0.0004999815077303579, 'samples': 494208, 'steps': 2573, 'loss/train': 2.548187017440796} +11/06/2021 21:37:48 - INFO - __main__ - Step 2575: {'lr': 0.000499981443129391, 'samples': 494400, 'steps': 2574, 'loss/train': 1.7672605514526367} +11/06/2021 21:37:49 - INFO - __main__ - Step 2576: {'lr': 0.0004999813784157863, 'samples': 494592, 'steps': 2575, 'loss/train': 1.979129433631897} +11/06/2021 21:37:49 - INFO - __main__ - Step 2577: {'lr': 0.0004999813135895438, 'samples': 494784, 'steps': 2576, 'loss/train': 2.5306124687194824} +11/06/2021 21:37:50 - INFO - __main__ - Step 2578: {'lr': 0.0004999812486506637, 'samples': 494976, 'steps': 2577, 'loss/train': 1.985874056816101} +11/06/2021 21:37:50 - INFO - __main__ - Step 2579: {'lr': 0.0004999811835991457, 'samples': 495168, 'steps': 2578, 'loss/train': 2.2465949058532715} +11/06/2021 21:37:50 - INFO - __main__ - Step 2580: {'lr': 0.0004999811184349902, 'samples': 495360, 'steps': 2579, 'loss/train': 1.718479871749878} +11/06/2021 21:37:51 - INFO - __main__ - Step 2581: {'lr': 0.000499981053158197, 'samples': 495552, 'steps': 2580, 'loss/train': 2.3030970096588135} +11/06/2021 21:37:52 - INFO - __main__ - Step 2582: {'lr': 0.0004999809877687662, 'samples': 495744, 'steps': 2581, 'loss/train': 2.4952125549316406} +11/06/2021 21:37:52 - INFO - __main__ - Step 2583: {'lr': 0.0004999809222666978, 'samples': 495936, 'steps': 2582, 'loss/train': 2.9251458644866943} +11/06/2021 21:37:52 - INFO - __main__ - Step 2584: {'lr': 0.0004999808566519919, 'samples': 496128, 'steps': 2583, 'loss/train': 2.0826971530914307} +11/06/2021 21:37:53 - INFO - __main__ - Step 2585: {'lr': 0.0004999807909246485, 'samples': 496320, 'steps': 2584, 'loss/train': 2.6530747413635254} +11/06/2021 21:37:54 - INFO - __main__ - Step 2586: {'lr': 0.0004999807250846676, 'samples': 496512, 'steps': 2585, 'loss/train': 2.023077964782715} +11/06/2021 21:37:54 - INFO - __main__ - Step 2587: {'lr': 0.0004999806591320492, 'samples': 496704, 'steps': 2586, 'loss/train': 2.128833532333374} +11/06/2021 21:37:54 - INFO - __main__ - Step 2588: {'lr': 0.0004999805930667934, 'samples': 496896, 'steps': 2587, 'loss/train': 2.2073006629943848} +11/06/2021 21:37:55 - INFO - __main__ - Step 2589: {'lr': 0.0004999805268889003, 'samples': 497088, 'steps': 2588, 'loss/train': 2.542658567428589} +11/06/2021 21:37:55 - INFO - __main__ - Step 2590: {'lr': 0.0004999804605983697, 'samples': 497280, 'steps': 2589, 'loss/train': 1.7954328060150146} +11/06/2021 21:37:56 - INFO - __main__ - Step 2591: {'lr': 0.0004999803941952018, 'samples': 497472, 'steps': 2590, 'loss/train': 1.970054030418396} +11/06/2021 21:37:57 - INFO - __main__ - Step 2592: {'lr': 0.0004999803276793965, 'samples': 497664, 'steps': 2591, 'loss/train': 2.5273969173431396} +11/06/2021 21:37:57 - INFO - __main__ - Step 2593: {'lr': 0.0004999802610509541, 'samples': 497856, 'steps': 2592, 'loss/train': 2.8750476837158203} +11/06/2021 21:37:57 - INFO - __main__ - Step 2594: {'lr': 0.0004999801943098743, 'samples': 498048, 'steps': 2593, 'loss/train': 2.145956039428711} +11/06/2021 21:37:58 - INFO - __main__ - Step 2595: {'lr': 0.0004999801274561573, 'samples': 498240, 'steps': 2594, 'loss/train': 1.3880176544189453} +11/06/2021 21:37:58 - INFO - __main__ - Step 2596: {'lr': 0.0004999800604898032, 'samples': 498432, 'steps': 2595, 'loss/train': 2.8618476390838623} +11/06/2021 21:37:59 - INFO - __main__ - Step 2597: {'lr': 0.000499979993410812, 'samples': 498624, 'steps': 2596, 'loss/train': 1.0421839952468872} +11/06/2021 21:37:59 - INFO - __main__ - Step 2598: {'lr': 0.0004999799262191835, 'samples': 498816, 'steps': 2597, 'loss/train': 2.2791144847869873} +11/06/2021 21:38:00 - INFO - __main__ - Step 2599: {'lr': 0.0004999798589149179, 'samples': 499008, 'steps': 2598, 'loss/train': 1.718825101852417} +11/06/2021 21:38:00 - INFO - __main__ - Step 2600: {'lr': 0.0004999797914980154, 'samples': 499200, 'steps': 2599, 'loss/train': 2.3873207569122314} +11/06/2021 21:38:01 - INFO - __main__ - Step 2601: {'lr': 0.0004999797239684757, 'samples': 499392, 'steps': 2600, 'loss/train': 1.5167217254638672} +11/06/2021 21:38:02 - INFO - __main__ - Step 2602: {'lr': 0.0004999796563262991, 'samples': 499584, 'steps': 2601, 'loss/train': 2.33709454536438} +11/06/2021 21:38:02 - INFO - __main__ - Step 2603: {'lr': 0.0004999795885714855, 'samples': 499776, 'steps': 2602, 'loss/train': 1.5589454174041748} +11/06/2021 21:38:02 - INFO - __main__ - Step 2604: {'lr': 0.0004999795207040349, 'samples': 499968, 'steps': 2603, 'loss/train': 3.2038750648498535} +11/06/2021 21:38:03 - INFO - __main__ - Step 2605: {'lr': 0.0004999794527239474, 'samples': 500160, 'steps': 2604, 'loss/train': 2.761178731918335} +11/06/2021 21:38:03 - INFO - __main__ - Step 2606: {'lr': 0.000499979384631223, 'samples': 500352, 'steps': 2605, 'loss/train': 2.426281690597534} +11/06/2021 21:38:03 - INFO - __main__ - Step 2607: {'lr': 0.000499979316425862, 'samples': 500544, 'steps': 2606, 'loss/train': 2.246225118637085} +11/06/2021 21:38:04 - INFO - __main__ - Step 2608: {'lr': 0.0004999792481078639, 'samples': 500736, 'steps': 2607, 'loss/train': 1.7112780809402466} +11/06/2021 21:38:05 - INFO - __main__ - Step 2609: {'lr': 0.000499979179677229, 'samples': 500928, 'steps': 2608, 'loss/train': 2.6037216186523438} +11/06/2021 21:38:05 - INFO - __main__ - Step 2610: {'lr': 0.0004999791111339574, 'samples': 501120, 'steps': 2609, 'loss/train': 2.3880434036254883} +11/06/2021 21:38:05 - INFO - __main__ - Step 2611: {'lr': 0.0004999790424780492, 'samples': 501312, 'steps': 2610, 'loss/train': 2.595461368560791} +11/06/2021 21:38:06 - INFO - __main__ - Step 2612: {'lr': 0.0004999789737095041, 'samples': 501504, 'steps': 2611, 'loss/train': 1.1569690704345703} +11/06/2021 21:38:07 - INFO - __main__ - Step 2613: {'lr': 0.0004999789048283224, 'samples': 501696, 'steps': 2612, 'loss/train': 3.0552828311920166} +11/06/2021 21:38:07 - INFO - __main__ - Step 2614: {'lr': 0.0004999788358345041, 'samples': 501888, 'steps': 2613, 'loss/train': 2.318122386932373} +11/06/2021 21:38:08 - INFO - __main__ - Step 2615: {'lr': 0.0004999787667280492, 'samples': 502080, 'steps': 2614, 'loss/train': 2.3980915546417236} +11/06/2021 21:38:08 - INFO - __main__ - Step 2616: {'lr': 0.0004999786975089577, 'samples': 502272, 'steps': 2615, 'loss/train': 4.580399513244629} +11/06/2021 21:38:08 - INFO - __main__ - Step 2617: {'lr': 0.0004999786281772296, 'samples': 502464, 'steps': 2616, 'loss/train': 2.6063055992126465} +11/06/2021 21:38:09 - INFO - __main__ - Step 2618: {'lr': 0.0004999785587328651, 'samples': 502656, 'steps': 2617, 'loss/train': 2.637915849685669} +11/06/2021 21:38:10 - INFO - __main__ - Step 2619: {'lr': 0.0004999784891758641, 'samples': 502848, 'steps': 2618, 'loss/train': 2.712459087371826} +11/06/2021 21:38:10 - INFO - __main__ - Step 2620: {'lr': 0.0004999784195062266, 'samples': 503040, 'steps': 2619, 'loss/train': 1.5384448766708374} +11/06/2021 21:38:10 - INFO - __main__ - Step 2621: {'lr': 0.0004999783497239526, 'samples': 503232, 'steps': 2620, 'loss/train': 2.1913907527923584} +11/06/2021 21:38:11 - INFO - __main__ - Step 2622: {'lr': 0.0004999782798290424, 'samples': 503424, 'steps': 2621, 'loss/train': 2.0295615196228027} +11/06/2021 21:38:11 - INFO - __main__ - Step 2623: {'lr': 0.0004999782098214957, 'samples': 503616, 'steps': 2622, 'loss/train': 2.4918506145477295} +11/06/2021 21:38:12 - INFO - __main__ - Step 2624: {'lr': 0.0004999781397013127, 'samples': 503808, 'steps': 2623, 'loss/train': 2.2522714138031006} +11/06/2021 21:38:13 - INFO - __main__ - Step 2625: {'lr': 0.0004999780694684934, 'samples': 504000, 'steps': 2624, 'loss/train': 2.477266550064087} +11/06/2021 21:38:13 - INFO - __main__ - Step 2626: {'lr': 0.000499977999123038, 'samples': 504192, 'steps': 2625, 'loss/train': 2.451108455657959} +11/06/2021 21:38:13 - INFO - __main__ - Step 2627: {'lr': 0.0004999779286649461, 'samples': 504384, 'steps': 2626, 'loss/train': 2.620913028717041} +11/06/2021 21:38:14 - INFO - __main__ - Step 2628: {'lr': 0.0004999778580942183, 'samples': 504576, 'steps': 2627, 'loss/train': 1.3361049890518188} +11/06/2021 21:38:15 - INFO - __main__ - Step 2629: {'lr': 0.000499977787410854, 'samples': 504768, 'steps': 2628, 'loss/train': 2.3474013805389404} +11/06/2021 21:38:15 - INFO - __main__ - Step 2630: {'lr': 0.0004999777166148539, 'samples': 504960, 'steps': 2629, 'loss/train': 2.328670024871826} +11/06/2021 21:38:15 - INFO - __main__ - Step 2631: {'lr': 0.0004999776457062175, 'samples': 505152, 'steps': 2630, 'loss/train': 2.4533984661102295} +11/06/2021 21:38:16 - INFO - __main__ - Step 2632: {'lr': 0.0004999775746849451, 'samples': 505344, 'steps': 2631, 'loss/train': 1.9219590425491333} +11/06/2021 21:38:16 - INFO - __main__ - Step 2633: {'lr': 0.0004999775035510367, 'samples': 505536, 'steps': 2632, 'loss/train': 1.3246666193008423} +11/06/2021 21:38:17 - INFO - __main__ - Step 2634: {'lr': 0.0004999774323044922, 'samples': 505728, 'steps': 2633, 'loss/train': 2.5250437259674072} +11/06/2021 21:38:17 - INFO - __main__ - Step 2635: {'lr': 0.0004999773609453118, 'samples': 505920, 'steps': 2634, 'loss/train': 2.8457674980163574} +11/06/2021 21:38:18 - INFO - __main__ - Step 2636: {'lr': 0.0004999772894734954, 'samples': 506112, 'steps': 2635, 'loss/train': 1.6440210342407227} +11/06/2021 21:38:18 - INFO - __main__ - Step 2637: {'lr': 0.000499977217889043, 'samples': 506304, 'steps': 2636, 'loss/train': 2.209573984146118} +11/06/2021 21:38:18 - INFO - __main__ - Step 2638: {'lr': 0.0004999771461919549, 'samples': 506496, 'steps': 2637, 'loss/train': 2.6149797439575195} +11/06/2021 21:38:20 - INFO - __main__ - Step 2639: {'lr': 0.0004999770743822309, 'samples': 506688, 'steps': 2638, 'loss/train': 1.8034636974334717} +11/06/2021 21:38:20 - INFO - __main__ - Step 2640: {'lr': 0.0004999770024598711, 'samples': 506880, 'steps': 2639, 'loss/train': 2.848144054412842} +11/06/2021 21:38:20 - INFO - __main__ - Step 2641: {'lr': 0.0004999769304248754, 'samples': 507072, 'steps': 2640, 'loss/train': 2.00382661819458} +11/06/2021 21:38:21 - INFO - __main__ - Step 2642: {'lr': 0.0004999768582772442, 'samples': 507264, 'steps': 2641, 'loss/train': 2.284688711166382} +11/06/2021 21:38:21 - INFO - __main__ - Step 2643: {'lr': 0.000499976786016977, 'samples': 507456, 'steps': 2642, 'loss/train': 2.6324987411499023} +11/06/2021 21:38:22 - INFO - __main__ - Step 2644: {'lr': 0.0004999767136440742, 'samples': 507648, 'steps': 2643, 'loss/train': 2.4299545288085938} +11/06/2021 21:38:22 - INFO - __main__ - Step 2645: {'lr': 0.0004999766411585359, 'samples': 507840, 'steps': 2644, 'loss/train': 2.3650753498077393} +11/06/2021 21:38:23 - INFO - __main__ - Step 2646: {'lr': 0.0004999765685603618, 'samples': 508032, 'steps': 2645, 'loss/train': 1.2427858114242554} +11/06/2021 21:38:23 - INFO - __main__ - Step 2647: {'lr': 0.0004999764958495522, 'samples': 508224, 'steps': 2646, 'loss/train': 1.7125329971313477} +11/06/2021 21:38:23 - INFO - __main__ - Step 2648: {'lr': 0.0004999764230261072, 'samples': 508416, 'steps': 2647, 'loss/train': 2.69739031791687} +11/06/2021 21:38:24 - INFO - __main__ - Step 2649: {'lr': 0.0004999763500900265, 'samples': 508608, 'steps': 2648, 'loss/train': 2.207709550857544} +11/06/2021 21:38:25 - INFO - __main__ - Step 2650: {'lr': 0.0004999762770413103, 'samples': 508800, 'steps': 2649, 'loss/train': 2.108356237411499} +11/06/2021 21:38:25 - INFO - __main__ - Step 2651: {'lr': 0.0004999762038799587, 'samples': 508992, 'steps': 2650, 'loss/train': 2.2225661277770996} +11/06/2021 21:38:25 - INFO - __main__ - Step 2652: {'lr': 0.0004999761306059717, 'samples': 509184, 'steps': 2651, 'loss/train': 2.4659764766693115} +11/06/2021 21:38:26 - INFO - __main__ - Step 2653: {'lr': 0.0004999760572193492, 'samples': 509376, 'steps': 2652, 'loss/train': 2.0966432094573975} +11/06/2021 21:38:26 - INFO - __main__ - Step 2654: {'lr': 0.0004999759837200914, 'samples': 509568, 'steps': 2653, 'loss/train': 2.6494579315185547} +11/06/2021 21:38:27 - INFO - __main__ - Step 2655: {'lr': 0.0004999759101081984, 'samples': 509760, 'steps': 2654, 'loss/train': 2.213627815246582} +11/06/2021 21:38:28 - INFO - __main__ - Step 2656: {'lr': 0.0004999758363836701, 'samples': 509952, 'steps': 2655, 'loss/train': 2.514630079269409} +11/06/2021 21:38:28 - INFO - __main__ - Step 2657: {'lr': 0.0004999757625465063, 'samples': 510144, 'steps': 2656, 'loss/train': 1.6061630249023438} +11/06/2021 21:38:28 - INFO - __main__ - Step 2658: {'lr': 0.0004999756885967075, 'samples': 510336, 'steps': 2657, 'loss/train': 1.924759030342102} +11/06/2021 21:38:29 - INFO - __main__ - Step 2659: {'lr': 0.0004999756145342735, 'samples': 510528, 'steps': 2658, 'loss/train': 1.7294937372207642} +11/06/2021 21:38:30 - INFO - __main__ - Step 2660: {'lr': 0.0004999755403592043, 'samples': 510720, 'steps': 2659, 'loss/train': 2.623060941696167} +11/06/2021 21:38:30 - INFO - __main__ - Step 2661: {'lr': 0.0004999754660714999, 'samples': 510912, 'steps': 2660, 'loss/train': 2.1438426971435547} +11/06/2021 21:38:30 - INFO - __main__ - Step 2662: {'lr': 0.0004999753916711606, 'samples': 511104, 'steps': 2661, 'loss/train': 1.9994590282440186} +11/06/2021 21:38:31 - INFO - __main__ - Step 2663: {'lr': 0.0004999753171581862, 'samples': 511296, 'steps': 2662, 'loss/train': 2.382080554962158} +11/06/2021 21:38:31 - INFO - __main__ - Step 2664: {'lr': 0.0004999752425325766, 'samples': 511488, 'steps': 2663, 'loss/train': 2.0769588947296143} +11/06/2021 21:38:32 - INFO - __main__ - Step 2665: {'lr': 0.0004999751677943322, 'samples': 511680, 'steps': 2664, 'loss/train': 1.7713021039962769} +11/06/2021 21:38:32 - INFO - __main__ - Step 2666: {'lr': 0.0004999750929434527, 'samples': 511872, 'steps': 2665, 'loss/train': 2.075993537902832} +11/06/2021 21:38:33 - INFO - __main__ - Step 2667: {'lr': 0.0004999750179799383, 'samples': 512064, 'steps': 2666, 'loss/train': 2.5356898307800293} +11/06/2021 21:38:33 - INFO - __main__ - Step 2668: {'lr': 0.0004999749429037892, 'samples': 512256, 'steps': 2667, 'loss/train': 2.999053716659546} +11/06/2021 21:38:33 - INFO - __main__ - Step 2669: {'lr': 0.0004999748677150051, 'samples': 512448, 'steps': 2668, 'loss/train': 2.6738812923431396} +11/06/2021 21:38:34 - INFO - __main__ - Step 2670: {'lr': 0.0004999747924135862, 'samples': 512640, 'steps': 2669, 'loss/train': 2.2657175064086914} +11/06/2021 21:38:35 - INFO - __main__ - Step 2671: {'lr': 0.0004999747169995325, 'samples': 512832, 'steps': 2670, 'loss/train': 2.049834966659546} +11/06/2021 21:38:35 - INFO - __main__ - Step 2672: {'lr': 0.0004999746414728441, 'samples': 513024, 'steps': 2671, 'loss/train': 2.0094645023345947} +11/06/2021 21:38:35 - INFO - __main__ - Step 2673: {'lr': 0.0004999745658335209, 'samples': 513216, 'steps': 2672, 'loss/train': 2.6007511615753174} +11/06/2021 21:38:36 - INFO - __main__ - Step 2674: {'lr': 0.000499974490081563, 'samples': 513408, 'steps': 2673, 'loss/train': 2.5795583724975586} +11/06/2021 21:38:37 - INFO - __main__ - Step 2675: {'lr': 0.0004999744142169707, 'samples': 513600, 'steps': 2674, 'loss/train': 1.848941445350647} +11/06/2021 21:38:37 - INFO - __main__ - Step 2676: {'lr': 0.0004999743382397435, 'samples': 513792, 'steps': 2675, 'loss/train': 2.2464025020599365} +11/06/2021 21:38:38 - INFO - __main__ - Step 2677: {'lr': 0.0004999742621498818, 'samples': 513984, 'steps': 2676, 'loss/train': 2.2649552822113037} +11/06/2021 21:38:38 - INFO - __main__ - Step 2678: {'lr': 0.0004999741859473857, 'samples': 514176, 'steps': 2677, 'loss/train': 2.3065757751464844} +11/06/2021 21:38:38 - INFO - __main__ - Step 2679: {'lr': 0.0004999741096322549, 'samples': 514368, 'steps': 2678, 'loss/train': 2.34328031539917} +11/06/2021 21:38:39 - INFO - __main__ - Step 2680: {'lr': 0.0004999740332044898, 'samples': 514560, 'steps': 2679, 'loss/train': 2.229511022567749} +11/06/2021 21:38:40 - INFO - __main__ - Step 2681: {'lr': 0.0004999739566640901, 'samples': 514752, 'steps': 2680, 'loss/train': 2.1822242736816406} +11/06/2021 21:38:40 - INFO - __main__ - Step 2682: {'lr': 0.000499973880011056, 'samples': 514944, 'steps': 2681, 'loss/train': 2.409409999847412} +11/06/2021 21:38:41 - INFO - __main__ - Step 2683: {'lr': 0.0004999738032453876, 'samples': 515136, 'steps': 2682, 'loss/train': 2.3872311115264893} +11/06/2021 21:38:41 - INFO - __main__ - Step 2684: {'lr': 0.0004999737263670848, 'samples': 515328, 'steps': 2683, 'loss/train': 2.3661561012268066} +11/06/2021 21:38:41 - INFO - __main__ - Step 2685: {'lr': 0.0004999736493761477, 'samples': 515520, 'steps': 2684, 'loss/train': 2.4622879028320312} +11/06/2021 21:38:42 - INFO - __main__ - Step 2686: {'lr': 0.0004999735722725765, 'samples': 515712, 'steps': 2685, 'loss/train': 1.6226389408111572} +11/06/2021 21:38:43 - INFO - __main__ - Step 2687: {'lr': 0.0004999734950563709, 'samples': 515904, 'steps': 2686, 'loss/train': 2.3979785442352295} +11/06/2021 21:38:43 - INFO - __main__ - Step 2688: {'lr': 0.0004999734177275311, 'samples': 516096, 'steps': 2687, 'loss/train': 2.707308769226074} +11/06/2021 21:38:43 - INFO - __main__ - Step 2689: {'lr': 0.0004999733402860572, 'samples': 516288, 'steps': 2688, 'loss/train': 2.6095635890960693} +11/06/2021 21:38:44 - INFO - __main__ - Step 2690: {'lr': 0.0004999732627319491, 'samples': 516480, 'steps': 2689, 'loss/train': 2.480802297592163} +11/06/2021 21:38:45 - INFO - __main__ - Step 2691: {'lr': 0.000499973185065207, 'samples': 516672, 'steps': 2690, 'loss/train': 2.4791250228881836} +11/06/2021 21:38:45 - INFO - __main__ - Step 2692: {'lr': 0.0004999731072858307, 'samples': 516864, 'steps': 2691, 'loss/train': 2.2488434314727783} +11/06/2021 21:38:45 - INFO - __main__ - Step 2693: {'lr': 0.0004999730293938205, 'samples': 517056, 'steps': 2692, 'loss/train': 2.4395229816436768} +11/06/2021 21:38:46 - INFO - __main__ - Step 2694: {'lr': 0.0004999729513891762, 'samples': 517248, 'steps': 2693, 'loss/train': 2.7909016609191895} +11/06/2021 21:38:46 - INFO - __main__ - Step 2695: {'lr': 0.000499972873271898, 'samples': 517440, 'steps': 2694, 'loss/train': 2.6461949348449707} +11/06/2021 21:38:47 - INFO - __main__ - Step 2696: {'lr': 0.0004999727950419859, 'samples': 517632, 'steps': 2695, 'loss/train': 2.5715339183807373} +11/06/2021 21:38:48 - INFO - __main__ - Step 2697: {'lr': 0.0004999727166994399, 'samples': 517824, 'steps': 2696, 'loss/train': 2.065563917160034} +11/06/2021 21:38:48 - INFO - __main__ - Step 2698: {'lr': 0.0004999726382442601, 'samples': 518016, 'steps': 2697, 'loss/train': 1.9356613159179688} +11/06/2021 21:38:48 - INFO - __main__ - Step 2699: {'lr': 0.0004999725596764465, 'samples': 518208, 'steps': 2698, 'loss/train': 1.576759934425354} +11/06/2021 21:38:49 - INFO - __main__ - Step 2700: {'lr': 0.000499972480995999, 'samples': 518400, 'steps': 2699, 'loss/train': 2.4644877910614014} +11/06/2021 21:38:49 - INFO - __main__ - Step 2701: {'lr': 0.0004999724022029179, 'samples': 518592, 'steps': 2700, 'loss/train': 2.8699357509613037} +11/06/2021 21:38:51 - INFO - __main__ - Step 2702: {'lr': 0.000499972323297203, 'samples': 518784, 'steps': 2701, 'loss/train': 2.5225210189819336} +11/06/2021 21:38:51 - INFO - __main__ - Step 2703: {'lr': 0.0004999722442788544, 'samples': 518976, 'steps': 2702, 'loss/train': 2.4827229976654053} +11/06/2021 21:38:51 - INFO - __main__ - Step 2704: {'lr': 0.0004999721651478723, 'samples': 519168, 'steps': 2703, 'loss/train': 1.9105079174041748} +11/06/2021 21:38:52 - INFO - __main__ - Step 2705: {'lr': 0.0004999720859042565, 'samples': 519360, 'steps': 2704, 'loss/train': 2.2500193119049072} +11/06/2021 21:38:52 - INFO - __main__ - Step 2706: {'lr': 0.0004999720065480071, 'samples': 519552, 'steps': 2705, 'loss/train': 2.6277735233306885} +11/06/2021 21:38:52 - INFO - __main__ - Step 2707: {'lr': 0.0004999719270791242, 'samples': 519744, 'steps': 2706, 'loss/train': 1.4648323059082031} +11/06/2021 21:38:53 - INFO - __main__ - Step 2708: {'lr': 0.0004999718474976078, 'samples': 519936, 'steps': 2707, 'loss/train': 2.773413896560669} +11/06/2021 21:38:54 - INFO - __main__ - Step 2709: {'lr': 0.000499971767803458, 'samples': 520128, 'steps': 2708, 'loss/train': 2.3420262336730957} +11/06/2021 21:38:54 - INFO - __main__ - Step 2710: {'lr': 0.0004999716879966747, 'samples': 520320, 'steps': 2709, 'loss/train': 2.6745805740356445} +11/06/2021 21:38:54 - INFO - __main__ - Step 2711: {'lr': 0.000499971608077258, 'samples': 520512, 'steps': 2710, 'loss/train': 1.5498085021972656} +11/06/2021 21:38:55 - INFO - __main__ - Step 2712: {'lr': 0.000499971528045208, 'samples': 520704, 'steps': 2711, 'loss/train': 2.7040622234344482} +11/06/2021 21:38:55 - INFO - __main__ - Step 2713: {'lr': 0.0004999714479005248, 'samples': 520896, 'steps': 2712, 'loss/train': 3.5146377086639404} +11/06/2021 21:38:56 - INFO - __main__ - Step 2714: {'lr': 0.0004999713676432082, 'samples': 521088, 'steps': 2713, 'loss/train': 2.1871511936187744} +11/06/2021 21:38:56 - INFO - __main__ - Step 2715: {'lr': 0.0004999712872732584, 'samples': 521280, 'steps': 2714, 'loss/train': 2.5216920375823975} +11/06/2021 21:38:57 - INFO - __main__ - Step 2716: {'lr': 0.0004999712067906754, 'samples': 521472, 'steps': 2715, 'loss/train': 2.882300615310669} +11/06/2021 21:38:57 - INFO - __main__ - Step 2717: {'lr': 0.0004999711261954591, 'samples': 521664, 'steps': 2716, 'loss/train': 2.44183349609375} +11/06/2021 21:38:57 - INFO - __main__ - Step 2718: {'lr': 0.0004999710454876099, 'samples': 521856, 'steps': 2717, 'loss/train': 2.10378360748291} +11/06/2021 21:38:59 - INFO - __main__ - Step 2719: {'lr': 0.0004999709646671274, 'samples': 522048, 'steps': 2718, 'loss/train': 2.456674098968506} +11/06/2021 21:38:59 - INFO - __main__ - Step 2720: {'lr': 0.0004999708837340119, 'samples': 522240, 'steps': 2719, 'loss/train': 2.4138710498809814} +11/06/2021 21:38:59 - INFO - __main__ - Step 2721: {'lr': 0.0004999708026882635, 'samples': 522432, 'steps': 2720, 'loss/train': 2.910074234008789} +11/06/2021 21:39:00 - INFO - __main__ - Step 2722: {'lr': 0.000499970721529882, 'samples': 522624, 'steps': 2721, 'loss/train': 3.079136848449707} +11/06/2021 21:39:00 - INFO - __main__ - Step 2723: {'lr': 0.0004999706402588675, 'samples': 522816, 'steps': 2722, 'loss/train': 2.3095333576202393} +11/06/2021 21:39:01 - INFO - __main__ - Step 2724: {'lr': 0.0004999705588752202, 'samples': 523008, 'steps': 2723, 'loss/train': 1.8380732536315918} +11/06/2021 21:39:01 - INFO - __main__ - Step 2725: {'lr': 0.00049997047737894, 'samples': 523200, 'steps': 2724, 'loss/train': 2.072640895843506} +11/06/2021 21:39:02 - INFO - __main__ - Step 2726: {'lr': 0.0004999703957700269, 'samples': 523392, 'steps': 2725, 'loss/train': 2.321617603302002} +11/06/2021 21:39:02 - INFO - __main__ - Step 2727: {'lr': 0.000499970314048481, 'samples': 523584, 'steps': 2726, 'loss/train': 2.2870664596557617} +11/06/2021 21:39:02 - INFO - __main__ - Step 2728: {'lr': 0.0004999702322143023, 'samples': 523776, 'steps': 2727, 'loss/train': 2.508100748062134} +11/06/2021 21:39:03 - INFO - __main__ - Step 2729: {'lr': 0.000499970150267491, 'samples': 523968, 'steps': 2728, 'loss/train': 2.8131275177001953} +11/06/2021 21:39:04 - INFO - __main__ - Step 2730: {'lr': 0.0004999700682080469, 'samples': 524160, 'steps': 2729, 'loss/train': 2.412299871444702} +11/06/2021 21:39:04 - INFO - __main__ - Step 2731: {'lr': 0.0004999699860359702, 'samples': 524352, 'steps': 2730, 'loss/train': 2.656719446182251} +11/06/2021 21:39:04 - INFO - __main__ - Step 2732: {'lr': 0.0004999699037512608, 'samples': 524544, 'steps': 2731, 'loss/train': 2.0453786849975586} +11/06/2021 21:39:05 - INFO - __main__ - Step 2733: {'lr': 0.000499969821353919, 'samples': 524736, 'steps': 2732, 'loss/train': 1.5553648471832275} +11/06/2021 21:39:06 - INFO - __main__ - Step 2734: {'lr': 0.0004999697388439444, 'samples': 524928, 'steps': 2733, 'loss/train': 2.4622724056243896} +11/06/2021 21:39:06 - INFO - __main__ - Step 2735: {'lr': 0.0004999696562213375, 'samples': 525120, 'steps': 2734, 'loss/train': 2.221712827682495} +11/06/2021 21:39:06 - INFO - __main__ - Step 2736: {'lr': 0.0004999695734860981, 'samples': 525312, 'steps': 2735, 'loss/train': 2.3038675785064697} +11/06/2021 21:39:07 - INFO - __main__ - Step 2737: {'lr': 0.0004999694906382262, 'samples': 525504, 'steps': 2736, 'loss/train': 2.3742024898529053} +11/06/2021 21:39:07 - INFO - __main__ - Step 2738: {'lr': 0.0004999694076777219, 'samples': 525696, 'steps': 2737, 'loss/train': 2.387545347213745} +11/06/2021 21:39:08 - INFO - __main__ - Step 2739: {'lr': 0.0004999693246045854, 'samples': 525888, 'steps': 2738, 'loss/train': 2.2682254314422607} +11/06/2021 21:39:08 - INFO - __main__ - Step 2740: {'lr': 0.0004999692414188164, 'samples': 526080, 'steps': 2739, 'loss/train': 1.0920865535736084} +11/06/2021 21:39:09 - INFO - __main__ - Step 2741: {'lr': 0.0004999691581204152, 'samples': 526272, 'steps': 2740, 'loss/train': 2.4095451831817627} +11/06/2021 21:39:09 - INFO - __main__ - Step 2742: {'lr': 0.0004999690747093816, 'samples': 526464, 'steps': 2741, 'loss/train': 2.6026110649108887} +11/06/2021 21:39:09 - INFO - __main__ - Step 2743: {'lr': 0.000499968991185716, 'samples': 526656, 'steps': 2742, 'loss/train': 2.7001304626464844} +11/06/2021 21:39:10 - INFO - __main__ - Step 2744: {'lr': 0.0004999689075494182, 'samples': 526848, 'steps': 2743, 'loss/train': 2.8792505264282227} +11/06/2021 21:39:11 - INFO - __main__ - Step 2745: {'lr': 0.0004999688238004882, 'samples': 527040, 'steps': 2744, 'loss/train': 1.739349603652954} +11/06/2021 21:39:11 - INFO - __main__ - Step 2746: {'lr': 0.0004999687399389262, 'samples': 527232, 'steps': 2745, 'loss/train': 1.9313324689865112} +11/06/2021 21:39:11 - INFO - __main__ - Step 2747: {'lr': 0.0004999686559647319, 'samples': 527424, 'steps': 2746, 'loss/train': 2.5279910564422607} +11/06/2021 21:39:12 - INFO - __main__ - Step 2748: {'lr': 0.0004999685718779058, 'samples': 527616, 'steps': 2747, 'loss/train': 2.2004690170288086} +11/06/2021 21:39:12 - INFO - __main__ - Step 2749: {'lr': 0.0004999684876784477, 'samples': 527808, 'steps': 2748, 'loss/train': 2.4345414638519287} +11/06/2021 21:39:13 - INFO - __main__ - Step 2750: {'lr': 0.0004999684033663576, 'samples': 528000, 'steps': 2749, 'loss/train': 1.688835620880127} +11/06/2021 21:39:14 - INFO - __main__ - Step 2751: {'lr': 0.0004999683189416356, 'samples': 528192, 'steps': 2750, 'loss/train': 1.597861647605896} +11/06/2021 21:39:14 - INFO - __main__ - Step 2752: {'lr': 0.0004999682344042817, 'samples': 528384, 'steps': 2751, 'loss/train': 2.844277858734131} +11/06/2021 21:39:14 - INFO - __main__ - Step 2753: {'lr': 0.000499968149754296, 'samples': 528576, 'steps': 2752, 'loss/train': 2.3030660152435303} +11/06/2021 21:39:15 - INFO - __main__ - Step 2754: {'lr': 0.0004999680649916786, 'samples': 528768, 'steps': 2753, 'loss/train': 2.6878316402435303} +11/06/2021 21:39:16 - INFO - __main__ - Step 2755: {'lr': 0.0004999679801164295, 'samples': 528960, 'steps': 2754, 'loss/train': 0.8238305449485779} +11/06/2021 21:39:17 - INFO - __main__ - Step 2756: {'lr': 0.0004999678951285485, 'samples': 529152, 'steps': 2755, 'loss/train': 2.0880188941955566} +11/06/2021 21:39:17 - INFO - __main__ - Step 2757: {'lr': 0.0004999678100280358, 'samples': 529344, 'steps': 2756, 'loss/train': 2.4757795333862305} +11/06/2021 21:39:17 - INFO - __main__ - Step 2758: {'lr': 0.0004999677248148916, 'samples': 529536, 'steps': 2757, 'loss/train': 2.4732248783111572} +11/06/2021 21:39:18 - INFO - __main__ - Step 2759: {'lr': 0.0004999676394891158, 'samples': 529728, 'steps': 2758, 'loss/train': 2.1484673023223877} +11/06/2021 21:39:18 - INFO - __main__ - Step 2760: {'lr': 0.0004999675540507083, 'samples': 529920, 'steps': 2759, 'loss/train': 3.0172383785247803} +11/06/2021 21:39:19 - INFO - __main__ - Step 2761: {'lr': 0.0004999674684996694, 'samples': 530112, 'steps': 2760, 'loss/train': 2.785417079925537} +11/06/2021 21:39:19 - INFO - __main__ - Step 2762: {'lr': 0.0004999673828359989, 'samples': 530304, 'steps': 2761, 'loss/train': 2.5744974613189697} +11/06/2021 21:39:20 - INFO - __main__ - Step 2763: {'lr': 0.0004999672970596971, 'samples': 530496, 'steps': 2762, 'loss/train': 2.5258822441101074} +11/06/2021 21:39:20 - INFO - __main__ - Step 2764: {'lr': 0.0004999672111707639, 'samples': 530688, 'steps': 2763, 'loss/train': 3.058380603790283} +11/06/2021 21:39:21 - INFO - __main__ - Step 2765: {'lr': 0.0004999671251691991, 'samples': 530880, 'steps': 2764, 'loss/train': 2.8081789016723633} +11/06/2021 21:39:21 - INFO - __main__ - Step 2766: {'lr': 0.0004999670390550032, 'samples': 531072, 'steps': 2765, 'loss/train': 2.2795279026031494} +11/06/2021 21:39:22 - INFO - __main__ - Step 2767: {'lr': 0.000499966952828176, 'samples': 531264, 'steps': 2766, 'loss/train': 1.8465057611465454} +11/06/2021 21:39:22 - INFO - __main__ - Step 2768: {'lr': 0.0004999668664887175, 'samples': 531456, 'steps': 2767, 'loss/train': 2.2657551765441895} +11/06/2021 21:39:23 - INFO - __main__ - Step 2769: {'lr': 0.0004999667800366278, 'samples': 531648, 'steps': 2768, 'loss/train': 2.2362067699432373} +11/06/2021 21:39:23 - INFO - __main__ - Step 2770: {'lr': 0.0004999666934719069, 'samples': 531840, 'steps': 2769, 'loss/train': 1.8398356437683105} +11/06/2021 21:39:23 - INFO - __main__ - Step 2771: {'lr': 0.0004999666067945548, 'samples': 532032, 'steps': 2770, 'loss/train': 2.37894868850708} +11/06/2021 21:39:24 - INFO - __main__ - Step 2772: {'lr': 0.0004999665200045716, 'samples': 532224, 'steps': 2771, 'loss/train': 1.0660734176635742} +11/06/2021 21:39:25 - INFO - __main__ - Step 2773: {'lr': 0.0004999664331019574, 'samples': 532416, 'steps': 2772, 'loss/train': 2.489011287689209} +11/06/2021 21:39:25 - INFO - __main__ - Step 2774: {'lr': 0.0004999663460867123, 'samples': 532608, 'steps': 2773, 'loss/train': 2.3319153785705566} +11/06/2021 21:39:25 - INFO - __main__ - Step 2775: {'lr': 0.000499966258958836, 'samples': 532800, 'steps': 2774, 'loss/train': 2.5055582523345947} +11/06/2021 21:39:26 - INFO - __main__ - Step 2776: {'lr': 0.000499966171718329, 'samples': 532992, 'steps': 2775, 'loss/train': 2.4398868083953857} +11/06/2021 21:39:27 - INFO - __main__ - Step 2777: {'lr': 0.000499966084365191, 'samples': 533184, 'steps': 2776, 'loss/train': 2.4442226886749268} +11/06/2021 21:39:27 - INFO - __main__ - Step 2778: {'lr': 0.0004999659968994221, 'samples': 533376, 'steps': 2777, 'loss/train': 2.8139424324035645} +11/06/2021 21:39:28 - INFO - __main__ - Step 2779: {'lr': 0.0004999659093210223, 'samples': 533568, 'steps': 2778, 'loss/train': 2.4639973640441895} +11/06/2021 21:39:28 - INFO - __main__ - Step 2780: {'lr': 0.0004999658216299919, 'samples': 533760, 'steps': 2779, 'loss/train': 2.217278242111206} +11/06/2021 21:39:28 - INFO - __main__ - Step 2781: {'lr': 0.0004999657338263308, 'samples': 533952, 'steps': 2780, 'loss/train': 2.8546433448791504} +11/06/2021 21:39:29 - INFO - __main__ - Step 2782: {'lr': 0.0004999656459100388, 'samples': 534144, 'steps': 2781, 'loss/train': 2.2053894996643066} +11/06/2021 21:39:30 - INFO - __main__ - Step 2783: {'lr': 0.0004999655578811161, 'samples': 534336, 'steps': 2782, 'loss/train': 2.2209572792053223} +11/06/2021 21:39:30 - INFO - __main__ - Step 2784: {'lr': 0.0004999654697395629, 'samples': 534528, 'steps': 2783, 'loss/train': 2.64697527885437} +11/06/2021 21:39:30 - INFO - __main__ - Step 2785: {'lr': 0.0004999653814853791, 'samples': 534720, 'steps': 2784, 'loss/train': 2.1000912189483643} +11/06/2021 21:39:31 - INFO - __main__ - Step 2786: {'lr': 0.0004999652931185648, 'samples': 534912, 'steps': 2785, 'loss/train': 2.200310468673706} +11/06/2021 21:39:32 - INFO - __main__ - Step 2787: {'lr': 0.00049996520463912, 'samples': 535104, 'steps': 2786, 'loss/train': 2.8074491024017334} +11/06/2021 21:39:32 - INFO - __main__ - Step 2788: {'lr': 0.0004999651160470447, 'samples': 535296, 'steps': 2787, 'loss/train': 2.2512643337249756} +11/06/2021 21:39:32 - INFO - __main__ - Step 2789: {'lr': 0.0004999650273423389, 'samples': 535488, 'steps': 2788, 'loss/train': 2.207897663116455} +11/06/2021 21:39:33 - INFO - __main__ - Step 2790: {'lr': 0.0004999649385250028, 'samples': 535680, 'steps': 2789, 'loss/train': 2.473784923553467} +11/06/2021 21:39:33 - INFO - __main__ - Step 2791: {'lr': 0.0004999648495950363, 'samples': 535872, 'steps': 2790, 'loss/train': 2.487807273864746} +11/06/2021 21:39:34 - INFO - __main__ - Step 2792: {'lr': 0.0004999647605524396, 'samples': 536064, 'steps': 2791, 'loss/train': 2.234999895095825} +11/06/2021 21:39:35 - INFO - __main__ - Step 2793: {'lr': 0.0004999646713972126, 'samples': 536256, 'steps': 2792, 'loss/train': 2.1799986362457275} +11/06/2021 21:39:35 - INFO - __main__ - Step 2794: {'lr': 0.0004999645821293552, 'samples': 536448, 'steps': 2793, 'loss/train': 1.1634377241134644} +11/06/2021 21:39:35 - INFO - __main__ - Step 2795: {'lr': 0.0004999644927488678, 'samples': 536640, 'steps': 2794, 'loss/train': 2.290945529937744} +11/06/2021 21:39:36 - INFO - __main__ - Step 2796: {'lr': 0.0004999644032557503, 'samples': 536832, 'steps': 2795, 'loss/train': 2.273956537246704} +11/06/2021 21:39:37 - INFO - __main__ - Step 2797: {'lr': 0.0004999643136500027, 'samples': 537024, 'steps': 2796, 'loss/train': 1.5732803344726562} +11/06/2021 21:39:37 - INFO - __main__ - Step 2798: {'lr': 0.0004999642239316249, 'samples': 537216, 'steps': 2797, 'loss/train': 2.646408796310425} +11/06/2021 21:39:38 - INFO - __main__ - Step 2799: {'lr': 0.000499964134100617, 'samples': 537408, 'steps': 2798, 'loss/train': 2.802149772644043} +11/06/2021 21:39:38 - INFO - __main__ - Step 2800: {'lr': 0.0004999640441569793, 'samples': 537600, 'steps': 2799, 'loss/train': 1.9303408861160278} +11/06/2021 21:39:38 - INFO - __main__ - Step 2801: {'lr': 0.0004999639541007116, 'samples': 537792, 'steps': 2800, 'loss/train': 2.0123252868652344} +11/06/2021 21:39:39 - INFO - __main__ - Step 2802: {'lr': 0.0004999638639318141, 'samples': 537984, 'steps': 2801, 'loss/train': 2.5675606727600098} +11/06/2021 21:39:40 - INFO - __main__ - Step 2803: {'lr': 0.0004999637736502866, 'samples': 538176, 'steps': 2802, 'loss/train': 2.3583943843841553} +11/06/2021 21:39:40 - INFO - __main__ - Step 2804: {'lr': 0.0004999636832561293, 'samples': 538368, 'steps': 2803, 'loss/train': 2.4021947383880615} +11/06/2021 21:39:40 - INFO - __main__ - Step 2805: {'lr': 0.0004999635927493423, 'samples': 538560, 'steps': 2804, 'loss/train': 2.4244282245635986} +11/06/2021 21:39:41 - INFO - __main__ - Step 2806: {'lr': 0.0004999635021299255, 'samples': 538752, 'steps': 2805, 'loss/train': 2.661571741104126} +11/06/2021 21:39:41 - INFO - __main__ - Step 2807: {'lr': 0.0004999634113978791, 'samples': 538944, 'steps': 2806, 'loss/train': 2.562166929244995} +11/06/2021 21:39:42 - INFO - __main__ - Step 2808: {'lr': 0.0004999633205532029, 'samples': 539136, 'steps': 2807, 'loss/train': 2.0239551067352295} +11/06/2021 21:39:43 - INFO - __main__ - Step 2809: {'lr': 0.0004999632295958972, 'samples': 539328, 'steps': 2808, 'loss/train': 2.355177164077759} +11/06/2021 21:39:43 - INFO - __main__ - Step 2810: {'lr': 0.0004999631385259617, 'samples': 539520, 'steps': 2809, 'loss/train': 2.7225186824798584} +11/06/2021 21:39:43 - INFO - __main__ - Step 2811: {'lr': 0.000499963047343397, 'samples': 539712, 'steps': 2810, 'loss/train': 1.7809796333312988} +11/06/2021 21:39:44 - INFO - __main__ - Step 2812: {'lr': 0.0004999629560482026, 'samples': 539904, 'steps': 2811, 'loss/train': 1.2682995796203613} +11/06/2021 21:39:45 - INFO - __main__ - Step 2813: {'lr': 0.0004999628646403788, 'samples': 540096, 'steps': 2812, 'loss/train': 2.061248302459717} +11/06/2021 21:39:45 - INFO - __main__ - Step 2814: {'lr': 0.0004999627731199256, 'samples': 540288, 'steps': 2813, 'loss/train': 2.505889654159546} +11/06/2021 21:39:45 - INFO - __main__ - Step 2815: {'lr': 0.0004999626814868429, 'samples': 540480, 'steps': 2814, 'loss/train': 1.8169455528259277} +11/06/2021 21:39:46 - INFO - __main__ - Step 2816: {'lr': 0.0004999625897411311, 'samples': 540672, 'steps': 2815, 'loss/train': 2.5656561851501465} +11/06/2021 21:39:46 - INFO - __main__ - Step 2817: {'lr': 0.0004999624978827899, 'samples': 540864, 'steps': 2816, 'loss/train': 2.479475736618042} +11/06/2021 21:39:47 - INFO - __main__ - Step 2818: {'lr': 0.0004999624059118194, 'samples': 541056, 'steps': 2817, 'loss/train': 1.6999139785766602} +11/06/2021 21:39:47 - INFO - __main__ - Step 2819: {'lr': 0.0004999623138282198, 'samples': 541248, 'steps': 2818, 'loss/train': 2.207723617553711} +11/06/2021 21:39:48 - INFO - __main__ - Step 2820: {'lr': 0.000499962221631991, 'samples': 541440, 'steps': 2819, 'loss/train': 2.569610357284546} +11/06/2021 21:39:48 - INFO - __main__ - Step 2821: {'lr': 0.0004999621293231331, 'samples': 541632, 'steps': 2820, 'loss/train': 2.8650639057159424} +11/06/2021 21:39:48 - INFO - __main__ - Step 2822: {'lr': 0.0004999620369016461, 'samples': 541824, 'steps': 2821, 'loss/train': 2.0223443508148193} +11/06/2021 21:39:49 - INFO - __main__ - Step 2823: {'lr': 0.00049996194436753, 'samples': 542016, 'steps': 2822, 'loss/train': 2.039158344268799} +11/06/2021 21:39:50 - INFO - __main__ - Step 2824: {'lr': 0.000499961851720785, 'samples': 542208, 'steps': 2823, 'loss/train': 2.3247768878936768} +11/06/2021 21:39:50 - INFO - __main__ - Step 2825: {'lr': 0.000499961758961411, 'samples': 542400, 'steps': 2824, 'loss/train': 2.4017333984375} +11/06/2021 21:39:50 - INFO - __main__ - Step 2826: {'lr': 0.0004999616660894081, 'samples': 542592, 'steps': 2825, 'loss/train': 2.326307535171509} +11/06/2021 21:39:51 - INFO - __main__ - Step 2827: {'lr': 0.0004999615731047762, 'samples': 542784, 'steps': 2826, 'loss/train': 2.21771240234375} +11/06/2021 21:39:52 - INFO - __main__ - Step 2828: {'lr': 0.0004999614800075158, 'samples': 542976, 'steps': 2827, 'loss/train': 1.7368288040161133} +11/06/2021 21:39:52 - INFO - __main__ - Step 2829: {'lr': 0.0004999613867976264, 'samples': 543168, 'steps': 2828, 'loss/train': 2.7821502685546875} +11/06/2021 21:39:53 - INFO - __main__ - Step 2830: {'lr': 0.0004999612934751082, 'samples': 543360, 'steps': 2829, 'loss/train': 2.315138101577759} +11/06/2021 21:39:53 - INFO - __main__ - Step 2831: {'lr': 0.0004999612000399614, 'samples': 543552, 'steps': 2830, 'loss/train': 2.502418041229248} +11/06/2021 21:39:53 - INFO - __main__ - Step 2832: {'lr': 0.0004999611064921859, 'samples': 543744, 'steps': 2831, 'loss/train': 2.381127119064331} +11/06/2021 21:39:54 - INFO - __main__ - Step 2833: {'lr': 0.0004999610128317818, 'samples': 543936, 'steps': 2832, 'loss/train': 1.7340575456619263} +11/06/2021 21:39:55 - INFO - __main__ - Step 2834: {'lr': 0.0004999609190587492, 'samples': 544128, 'steps': 2833, 'loss/train': 2.435819387435913} +11/06/2021 21:39:55 - INFO - __main__ - Step 2835: {'lr': 0.000499960825173088, 'samples': 544320, 'steps': 2834, 'loss/train': 2.3425838947296143} +11/06/2021 21:39:55 - INFO - __main__ - Step 2836: {'lr': 0.0004999607311747983, 'samples': 544512, 'steps': 2835, 'loss/train': 1.7845638990402222} +11/06/2021 21:39:56 - INFO - __main__ - Step 2837: {'lr': 0.0004999606370638801, 'samples': 544704, 'steps': 2836, 'loss/train': 1.946204423904419} +11/06/2021 21:39:56 - INFO - __main__ - Step 2838: {'lr': 0.0004999605428403336, 'samples': 544896, 'steps': 2837, 'loss/train': 2.6006252765655518} +11/06/2021 21:39:57 - INFO - __main__ - Step 2839: {'lr': 0.0004999604485041585, 'samples': 545088, 'steps': 2838, 'loss/train': 2.409191131591797} +11/06/2021 21:39:57 - INFO - __main__ - Step 2840: {'lr': 0.0004999603540553554, 'samples': 545280, 'steps': 2839, 'loss/train': 2.562089204788208} +11/06/2021 21:39:58 - INFO - __main__ - Step 2841: {'lr': 0.0004999602594939238, 'samples': 545472, 'steps': 2840, 'loss/train': 2.2880022525787354} +11/06/2021 21:39:58 - INFO - __main__ - Step 2842: {'lr': 0.0004999601648198641, 'samples': 545664, 'steps': 2841, 'loss/train': 2.791858434677124} +11/06/2021 21:39:58 - INFO - __main__ - Step 2843: {'lr': 0.0004999600700331761, 'samples': 545856, 'steps': 2842, 'loss/train': 2.366997003555298} +11/06/2021 21:40:00 - INFO - __main__ - Step 2844: {'lr': 0.0004999599751338601, 'samples': 546048, 'steps': 2843, 'loss/train': 2.355536937713623} +11/06/2021 21:40:00 - INFO - __main__ - Step 2845: {'lr': 0.0004999598801219158, 'samples': 546240, 'steps': 2844, 'loss/train': 1.3548896312713623} +11/06/2021 21:40:00 - INFO - __main__ - Step 2846: {'lr': 0.0004999597849973435, 'samples': 546432, 'steps': 2845, 'loss/train': 2.1477577686309814} +11/06/2021 21:40:01 - INFO - __main__ - Step 2847: {'lr': 0.0004999596897601432, 'samples': 546624, 'steps': 2846, 'loss/train': 1.9438403844833374} +11/06/2021 21:40:01 - INFO - __main__ - Step 2848: {'lr': 0.0004999595944103149, 'samples': 546816, 'steps': 2847, 'loss/train': 2.6734774112701416} +11/06/2021 21:40:02 - INFO - __main__ - Step 2849: {'lr': 0.0004999594989478587, 'samples': 547008, 'steps': 2848, 'loss/train': 2.6153666973114014} +11/06/2021 21:40:02 - INFO - __main__ - Step 2850: {'lr': 0.0004999594033727747, 'samples': 547200, 'steps': 2849, 'loss/train': 2.0793142318725586} +11/06/2021 21:40:03 - INFO - __main__ - Step 2851: {'lr': 0.0004999593076850627, 'samples': 547392, 'steps': 2850, 'loss/train': 2.2441251277923584} +11/06/2021 21:40:03 - INFO - __main__ - Step 2852: {'lr': 0.0004999592118847229, 'samples': 547584, 'steps': 2851, 'loss/train': 2.7743895053863525} +11/06/2021 21:40:03 - INFO - __main__ - Step 2853: {'lr': 0.0004999591159717554, 'samples': 547776, 'steps': 2852, 'loss/train': 2.089233160018921} +11/06/2021 21:40:04 - INFO - __main__ - Step 2854: {'lr': 0.0004999590199461602, 'samples': 547968, 'steps': 2853, 'loss/train': 2.220766067504883} +11/06/2021 21:40:05 - INFO - __main__ - Step 2855: {'lr': 0.0004999589238079373, 'samples': 548160, 'steps': 2854, 'loss/train': 2.098376989364624} +11/06/2021 21:40:05 - INFO - __main__ - Step 2856: {'lr': 0.0004999588275570868, 'samples': 548352, 'steps': 2855, 'loss/train': 2.4644670486450195} +11/06/2021 21:40:05 - INFO - __main__ - Step 2857: {'lr': 0.0004999587311936086, 'samples': 548544, 'steps': 2856, 'loss/train': 2.239152193069458} +11/06/2021 21:40:06 - INFO - __main__ - Step 2858: {'lr': 0.000499958634717503, 'samples': 548736, 'steps': 2857, 'loss/train': 1.4249017238616943} +11/06/2021 21:40:07 - INFO - __main__ - Step 2859: {'lr': 0.0004999585381287696, 'samples': 548928, 'steps': 2858, 'loss/train': 2.2999162673950195} +11/06/2021 21:40:07 - INFO - __main__ - Step 2860: {'lr': 0.000499958441427409, 'samples': 549120, 'steps': 2859, 'loss/train': 2.8387157917022705} +11/06/2021 21:40:08 - INFO - __main__ - Step 2861: {'lr': 0.0004999583446134209, 'samples': 549312, 'steps': 2860, 'loss/train': 2.874333620071411} +11/06/2021 21:40:08 - INFO - __main__ - Step 2862: {'lr': 0.0004999582476868055, 'samples': 549504, 'steps': 2861, 'loss/train': 2.6905484199523926} +11/06/2021 21:40:08 - INFO - __main__ - Step 2863: {'lr': 0.0004999581506475627, 'samples': 549696, 'steps': 2862, 'loss/train': 2.1297647953033447} +11/06/2021 21:40:09 - INFO - __main__ - Step 2864: {'lr': 0.0004999580534956927, 'samples': 549888, 'steps': 2863, 'loss/train': 2.871276378631592} +11/06/2021 21:40:10 - INFO - __main__ - Step 2865: {'lr': 0.0004999579562311953, 'samples': 550080, 'steps': 2864, 'loss/train': 1.109349012374878} +11/06/2021 21:40:10 - INFO - __main__ - Step 2866: {'lr': 0.0004999578588540709, 'samples': 550272, 'steps': 2865, 'loss/train': 2.0491299629211426} +11/06/2021 21:40:10 - INFO - __main__ - Step 2867: {'lr': 0.0004999577613643192, 'samples': 550464, 'steps': 2866, 'loss/train': 2.0363290309906006} +11/06/2021 21:40:11 - INFO - __main__ - Step 2868: {'lr': 0.0004999576637619404, 'samples': 550656, 'steps': 2867, 'loss/train': 2.5006585121154785} +11/06/2021 21:40:11 - INFO - __main__ - Step 2869: {'lr': 0.0004999575660469347, 'samples': 550848, 'steps': 2868, 'loss/train': 2.5980803966522217} +11/06/2021 21:40:12 - INFO - __main__ - Step 2870: {'lr': 0.0004999574682193017, 'samples': 551040, 'steps': 2869, 'loss/train': 1.786831259727478} +11/06/2021 21:40:13 - INFO - __main__ - Step 2871: {'lr': 0.0004999573702790419, 'samples': 551232, 'steps': 2870, 'loss/train': 1.8787875175476074} +11/06/2021 21:40:13 - INFO - __main__ - Step 2872: {'lr': 0.0004999572722261551, 'samples': 551424, 'steps': 2871, 'loss/train': 1.8773044347763062} +11/06/2021 21:40:13 - INFO - __main__ - Step 2873: {'lr': 0.0004999571740606415, 'samples': 551616, 'steps': 2872, 'loss/train': 2.097402572631836} +11/06/2021 21:40:14 - INFO - __main__ - Step 2874: {'lr': 0.000499957075782501, 'samples': 551808, 'steps': 2873, 'loss/train': 1.8168832063674927} +11/06/2021 21:40:15 - INFO - __main__ - Step 2875: {'lr': 0.0004999569773917337, 'samples': 552000, 'steps': 2874, 'loss/train': 2.0323092937469482} +11/06/2021 21:40:15 - INFO - __main__ - Step 2876: {'lr': 0.0004999568788883397, 'samples': 552192, 'steps': 2875, 'loss/train': 1.8158880472183228} +11/06/2021 21:40:15 - INFO - __main__ - Step 2877: {'lr': 0.0004999567802723188, 'samples': 552384, 'steps': 2876, 'loss/train': 2.2598671913146973} +11/06/2021 21:40:16 - INFO - __main__ - Step 2878: {'lr': 0.0004999566815436715, 'samples': 552576, 'steps': 2877, 'loss/train': 2.445081949234009} +11/06/2021 21:40:16 - INFO - __main__ - Step 2879: {'lr': 0.0004999565827023974, 'samples': 552768, 'steps': 2878, 'loss/train': 2.130836009979248} +11/06/2021 21:40:17 - INFO - __main__ - Step 2880: {'lr': 0.0004999564837484967, 'samples': 552960, 'steps': 2879, 'loss/train': 2.3038902282714844} +11/06/2021 21:40:17 - INFO - __main__ - Step 2881: {'lr': 0.0004999563846819696, 'samples': 553152, 'steps': 2880, 'loss/train': 2.3476128578186035} +11/06/2021 21:40:18 - INFO - __main__ - Step 2882: {'lr': 0.0004999562855028159, 'samples': 553344, 'steps': 2881, 'loss/train': 2.6095919609069824} +11/06/2021 21:40:18 - INFO - __main__ - Step 2883: {'lr': 0.0004999561862110358, 'samples': 553536, 'steps': 2882, 'loss/train': 1.861746072769165} +11/06/2021 21:40:18 - INFO - __main__ - Step 2884: {'lr': 0.0004999560868066293, 'samples': 553728, 'steps': 2883, 'loss/train': 2.09774112701416} +11/06/2021 21:40:20 - INFO - __main__ - Step 2885: {'lr': 0.0004999559872895964, 'samples': 553920, 'steps': 2884, 'loss/train': 1.9192487001419067} +11/06/2021 21:40:20 - INFO - __main__ - Step 2886: {'lr': 0.0004999558876599373, 'samples': 554112, 'steps': 2885, 'loss/train': 2.2191450595855713} +11/06/2021 21:40:20 - INFO - __main__ - Step 2887: {'lr': 0.0004999557879176518, 'samples': 554304, 'steps': 2886, 'loss/train': 2.411027193069458} +11/06/2021 21:40:21 - INFO - __main__ - Step 2888: {'lr': 0.0004999556880627401, 'samples': 554496, 'steps': 2887, 'loss/train': 2.7569634914398193} +11/06/2021 21:40:21 - INFO - __main__ - Step 2889: {'lr': 0.0004999555880952023, 'samples': 554688, 'steps': 2888, 'loss/train': 2.49636173248291} +11/06/2021 21:40:22 - INFO - __main__ - Step 2890: {'lr': 0.0004999554880150383, 'samples': 554880, 'steps': 2889, 'loss/train': 2.0643162727355957} +11/06/2021 21:40:22 - INFO - __main__ - Step 2891: {'lr': 0.0004999553878222482, 'samples': 555072, 'steps': 2890, 'loss/train': 1.2182731628417969} +11/06/2021 21:40:23 - INFO - __main__ - Step 2892: {'lr': 0.0004999552875168321, 'samples': 555264, 'steps': 2891, 'loss/train': 2.110027551651001} +11/06/2021 21:40:23 - INFO - __main__ - Step 2893: {'lr': 0.0004999551870987901, 'samples': 555456, 'steps': 2892, 'loss/train': 2.0621578693389893} +11/06/2021 21:40:23 - INFO - __main__ - Step 2894: {'lr': 0.000499955086568122, 'samples': 555648, 'steps': 2893, 'loss/train': 2.4326114654541016} +11/06/2021 21:40:24 - INFO - __main__ - Step 2895: {'lr': 0.000499954985924828, 'samples': 555840, 'steps': 2894, 'loss/train': 1.992488980293274} +11/06/2021 21:40:25 - INFO - __main__ - Step 2896: {'lr': 0.0004999548851689082, 'samples': 556032, 'steps': 2895, 'loss/train': 1.6926281452178955} +11/06/2021 21:40:25 - INFO - __main__ - Step 2897: {'lr': 0.0004999547843003627, 'samples': 556224, 'steps': 2896, 'loss/train': 2.2497506141662598} +11/06/2021 21:40:25 - INFO - __main__ - Step 2898: {'lr': 0.0004999546833191912, 'samples': 556416, 'steps': 2897, 'loss/train': 2.4135076999664307} +11/06/2021 21:40:26 - INFO - __main__ - Step 2899: {'lr': 0.0004999545822253941, 'samples': 556608, 'steps': 2898, 'loss/train': 1.9909908771514893} +11/06/2021 21:40:27 - INFO - __main__ - Step 2900: {'lr': 0.0004999544810189713, 'samples': 556800, 'steps': 2899, 'loss/train': 1.9784951210021973} +11/06/2021 21:40:27 - INFO - __main__ - Step 2901: {'lr': 0.0004999543796999228, 'samples': 556992, 'steps': 2900, 'loss/train': 2.4324984550476074} +11/06/2021 21:40:27 - INFO - __main__ - Step 2902: {'lr': 0.0004999542782682489, 'samples': 557184, 'steps': 2901, 'loss/train': 1.6676363945007324} +11/06/2021 21:40:28 - INFO - __main__ - Step 2903: {'lr': 0.0004999541767239493, 'samples': 557376, 'steps': 2902, 'loss/train': 2.2086076736450195} +11/06/2021 21:40:28 - INFO - __main__ - Step 2904: {'lr': 0.0004999540750670243, 'samples': 557568, 'steps': 2903, 'loss/train': 2.221266746520996} +11/06/2021 21:40:28 - INFO - __main__ - Step 2905: {'lr': 0.0004999539732974738, 'samples': 557760, 'steps': 2904, 'loss/train': 1.9565421342849731} +11/06/2021 21:40:29 - INFO - __main__ - Step 2906: {'lr': 0.0004999538714152978, 'samples': 557952, 'steps': 2905, 'loss/train': 2.1874446868896484} +11/06/2021 21:40:30 - INFO - __main__ - Step 2907: {'lr': 0.0004999537694204966, 'samples': 558144, 'steps': 2906, 'loss/train': 1.4559849500656128} +11/06/2021 21:40:30 - INFO - __main__ - Step 2908: {'lr': 0.0004999536673130701, 'samples': 558336, 'steps': 2907, 'loss/train': 2.1022891998291016} +11/06/2021 21:40:30 - INFO - __main__ - Step 2909: {'lr': 0.0004999535650930182, 'samples': 558528, 'steps': 2908, 'loss/train': 1.6833531856536865} +11/06/2021 21:40:31 - INFO - __main__ - Step 2910: {'lr': 0.0004999534627603411, 'samples': 558720, 'steps': 2909, 'loss/train': 1.6895768642425537} +11/06/2021 21:40:33 - INFO - __main__ - Step 2911: {'lr': 0.0004999533603150389, 'samples': 558912, 'steps': 2910, 'loss/train': 2.199605703353882} +11/06/2021 21:40:33 - INFO - __main__ - Step 2912: {'lr': 0.0004999532577571116, 'samples': 559104, 'steps': 2911, 'loss/train': 2.348113536834717} +11/06/2021 21:40:33 - INFO - __main__ - Step 2913: {'lr': 0.0004999531550865592, 'samples': 559296, 'steps': 2912, 'loss/train': 1.9907268285751343} +11/06/2021 21:40:34 - INFO - __main__ - Step 2914: {'lr': 0.0004999530523033817, 'samples': 559488, 'steps': 2913, 'loss/train': 1.3060599565505981} +11/06/2021 21:40:34 - INFO - __main__ - Step 2915: {'lr': 0.0004999529494075792, 'samples': 559680, 'steps': 2914, 'loss/train': 2.2429051399230957} +11/06/2021 21:40:34 - INFO - __main__ - Step 2916: {'lr': 0.0004999528463991518, 'samples': 559872, 'steps': 2915, 'loss/train': 3.520594596862793} +11/06/2021 21:40:35 - INFO - __main__ - Step 2917: {'lr': 0.0004999527432780995, 'samples': 560064, 'steps': 2916, 'loss/train': 2.8024425506591797} +11/06/2021 21:40:36 - INFO - __main__ - Step 2918: {'lr': 0.0004999526400444223, 'samples': 560256, 'steps': 2917, 'loss/train': 2.3068015575408936} +11/06/2021 21:40:36 - INFO - __main__ - Step 2919: {'lr': 0.0004999525366981204, 'samples': 560448, 'steps': 2918, 'loss/train': 2.4727816581726074} +11/06/2021 21:40:36 - INFO - __main__ - Step 2920: {'lr': 0.0004999524332391937, 'samples': 560640, 'steps': 2919, 'loss/train': 1.4589003324508667} +11/06/2021 21:40:37 - INFO - __main__ - Step 2921: {'lr': 0.0004999523296676423, 'samples': 560832, 'steps': 2920, 'loss/train': 2.8546531200408936} +11/06/2021 21:40:38 - INFO - __main__ - Step 2922: {'lr': 0.0004999522259834662, 'samples': 561024, 'steps': 2921, 'loss/train': 2.01436185836792} +11/06/2021 21:40:38 - INFO - __main__ - Step 2923: {'lr': 0.0004999521221866655, 'samples': 561216, 'steps': 2922, 'loss/train': 2.9022979736328125} +11/06/2021 21:40:38 - INFO - __main__ - Step 2924: {'lr': 0.0004999520182772402, 'samples': 561408, 'steps': 2923, 'loss/train': 2.112090826034546} +11/06/2021 21:40:39 - INFO - __main__ - Step 2925: {'lr': 0.0004999519142551905, 'samples': 561600, 'steps': 2924, 'loss/train': 2.724461317062378} +11/06/2021 21:40:39 - INFO - __main__ - Step 2926: {'lr': 0.0004999518101205162, 'samples': 561792, 'steps': 2925, 'loss/train': 3.0705063343048096} +11/06/2021 21:40:40 - INFO - __main__ - Step 2927: {'lr': 0.0004999517058732175, 'samples': 561984, 'steps': 2926, 'loss/train': 2.3945233821868896} +11/06/2021 21:40:41 - INFO - __main__ - Step 2928: {'lr': 0.0004999516015132945, 'samples': 562176, 'steps': 2927, 'loss/train': 1.2997283935546875} +11/06/2021 21:40:41 - INFO - __main__ - Step 2929: {'lr': 0.0004999514970407471, 'samples': 562368, 'steps': 2928, 'loss/train': 1.4309011697769165} +11/06/2021 21:40:41 - INFO - __main__ - Step 2930: {'lr': 0.0004999513924555754, 'samples': 562560, 'steps': 2929, 'loss/train': 1.5472474098205566} +11/06/2021 21:40:42 - INFO - __main__ - Step 2931: {'lr': 0.0004999512877577794, 'samples': 562752, 'steps': 2930, 'loss/train': 2.173020601272583} +11/06/2021 21:40:43 - INFO - __main__ - Step 2932: {'lr': 0.0004999511829473593, 'samples': 562944, 'steps': 2931, 'loss/train': 1.8353915214538574} +11/06/2021 21:40:43 - INFO - __main__ - Step 2933: {'lr': 0.0004999510780243151, 'samples': 563136, 'steps': 2932, 'loss/train': 1.7260181903839111} +11/06/2021 21:40:43 - INFO - __main__ - Step 2934: {'lr': 0.0004999509729886467, 'samples': 563328, 'steps': 2933, 'loss/train': 2.6757678985595703} +11/06/2021 21:40:44 - INFO - __main__ - Step 2935: {'lr': 0.0004999508678403542, 'samples': 563520, 'steps': 2934, 'loss/train': 2.1792075634002686} +11/06/2021 21:40:44 - INFO - __main__ - Step 2936: {'lr': 0.0004999507625794378, 'samples': 563712, 'steps': 2935, 'loss/train': 2.2181787490844727} +11/06/2021 21:40:45 - INFO - __main__ - Step 2937: {'lr': 0.0004999506572058974, 'samples': 563904, 'steps': 2936, 'loss/train': 2.060746192932129} +11/06/2021 21:40:45 - INFO - __main__ - Step 2938: {'lr': 0.0004999505517197331, 'samples': 564096, 'steps': 2937, 'loss/train': 2.2606637477874756} +11/06/2021 21:40:46 - INFO - __main__ - Step 2939: {'lr': 0.000499950446120945, 'samples': 564288, 'steps': 2938, 'loss/train': 1.9064645767211914} +11/06/2021 21:40:46 - INFO - __main__ - Step 2940: {'lr': 0.000499950340409533, 'samples': 564480, 'steps': 2939, 'loss/train': 2.1608986854553223} +11/06/2021 21:40:46 - INFO - __main__ - Step 2941: {'lr': 0.0004999502345854973, 'samples': 564672, 'steps': 2940, 'loss/train': 2.2429375648498535} +11/06/2021 21:40:47 - INFO - __main__ - Step 2942: {'lr': 0.0004999501286488378, 'samples': 564864, 'steps': 2941, 'loss/train': 2.142625093460083} +11/06/2021 21:40:48 - INFO - __main__ - Step 2943: {'lr': 0.0004999500225995547, 'samples': 565056, 'steps': 2942, 'loss/train': 2.0483415126800537} +11/06/2021 21:40:48 - INFO - __main__ - Step 2944: {'lr': 0.000499949916437648, 'samples': 565248, 'steps': 2943, 'loss/train': 2.363560199737549} +11/06/2021 21:40:49 - INFO - __main__ - Step 2945: {'lr': 0.0004999498101631177, 'samples': 565440, 'steps': 2944, 'loss/train': 2.750171422958374} +11/06/2021 21:40:49 - INFO - __main__ - Step 2946: {'lr': 0.0004999497037759638, 'samples': 565632, 'steps': 2945, 'loss/train': 2.285203218460083} +11/06/2021 21:40:49 - INFO - __main__ - Step 2947: {'lr': 0.0004999495972761865, 'samples': 565824, 'steps': 2946, 'loss/train': 2.084728479385376} +11/06/2021 21:40:50 - INFO - __main__ - Step 2948: {'lr': 0.0004999494906637857, 'samples': 566016, 'steps': 2947, 'loss/train': 2.138784646987915} +11/06/2021 21:40:51 - INFO - __main__ - Step 2949: {'lr': 0.0004999493839387615, 'samples': 566208, 'steps': 2948, 'loss/train': 0.8493632674217224} +11/06/2021 21:40:51 - INFO - __main__ - Step 2950: {'lr': 0.000499949277101114, 'samples': 566400, 'steps': 2949, 'loss/train': 2.2582223415374756} +11/06/2021 21:40:51 - INFO - __main__ - Step 2951: {'lr': 0.0004999491701508433, 'samples': 566592, 'steps': 2950, 'loss/train': 2.1516506671905518} +11/06/2021 21:40:52 - INFO - __main__ - Step 2952: {'lr': 0.0004999490630879493, 'samples': 566784, 'steps': 2951, 'loss/train': 1.5355583429336548} +11/06/2021 21:40:53 - INFO - __main__ - Step 2953: {'lr': 0.0004999489559124321, 'samples': 566976, 'steps': 2952, 'loss/train': 1.9333853721618652} +11/06/2021 21:40:53 - INFO - __main__ - Step 2954: {'lr': 0.0004999488486242918, 'samples': 567168, 'steps': 2953, 'loss/train': 1.470977783203125} +11/06/2021 21:40:53 - INFO - __main__ - Step 2955: {'lr': 0.0004999487412235284, 'samples': 567360, 'steps': 2954, 'loss/train': 2.435324192047119} +11/06/2021 21:40:54 - INFO - __main__ - Step 2956: {'lr': 0.0004999486337101419, 'samples': 567552, 'steps': 2955, 'loss/train': 2.1768510341644287} +11/06/2021 21:40:54 - INFO - __main__ - Step 2957: {'lr': 0.0004999485260841324, 'samples': 567744, 'steps': 2956, 'loss/train': 2.5534868240356445} +11/06/2021 21:40:55 - INFO - __main__ - Step 2958: {'lr': 0.0004999484183455, 'samples': 567936, 'steps': 2957, 'loss/train': 2.551486015319824} +11/06/2021 21:40:55 - INFO - __main__ - Step 2959: {'lr': 0.0004999483104942446, 'samples': 568128, 'steps': 2958, 'loss/train': 2.710608720779419} +11/06/2021 21:40:56 - INFO - __main__ - Step 2960: {'lr': 0.0004999482025303665, 'samples': 568320, 'steps': 2959, 'loss/train': 2.0834438800811768} +11/06/2021 21:40:56 - INFO - __main__ - Step 2961: {'lr': 0.0004999480944538655, 'samples': 568512, 'steps': 2960, 'loss/train': 2.1335995197296143} +11/06/2021 21:40:57 - INFO - __main__ - Step 2962: {'lr': 0.0004999479862647417, 'samples': 568704, 'steps': 2961, 'loss/train': 1.7323172092437744} +11/06/2021 21:40:57 - INFO - __main__ - Step 2963: {'lr': 0.0004999478779629953, 'samples': 568896, 'steps': 2962, 'loss/train': 1.3542144298553467} +11/06/2021 21:40:58 - INFO - __main__ - Step 2964: {'lr': 0.0004999477695486261, 'samples': 569088, 'steps': 2963, 'loss/train': 2.248361349105835} +11/06/2021 21:40:58 - INFO - __main__ - Step 2965: {'lr': 0.0004999476610216345, 'samples': 569280, 'steps': 2964, 'loss/train': 1.651444673538208} +11/06/2021 21:40:59 - INFO - __main__ - Step 2966: {'lr': 0.0004999475523820203, 'samples': 569472, 'steps': 2965, 'loss/train': 1.6673521995544434} +11/06/2021 21:40:59 - INFO - __main__ - Step 2967: {'lr': 0.0004999474436297835, 'samples': 569664, 'steps': 2966, 'loss/train': 2.576014995574951} +11/06/2021 21:40:59 - INFO - __main__ - Step 2968: {'lr': 0.0004999473347649242, 'samples': 569856, 'steps': 2967, 'loss/train': 2.7090260982513428} +11/06/2021 21:41:00 - INFO - __main__ - Step 2969: {'lr': 0.0004999472257874426, 'samples': 570048, 'steps': 2968, 'loss/train': 2.4172799587249756} +11/06/2021 21:41:01 - INFO - __main__ - Step 2970: {'lr': 0.0004999471166973385, 'samples': 570240, 'steps': 2969, 'loss/train': 2.754880905151367} +11/06/2021 21:41:01 - INFO - __main__ - Step 2971: {'lr': 0.0004999470074946122, 'samples': 570432, 'steps': 2970, 'loss/train': 2.2452704906463623} +11/06/2021 21:41:01 - INFO - __main__ - Step 2972: {'lr': 0.0004999468981792636, 'samples': 570624, 'steps': 2971, 'loss/train': 1.8505585193634033} +11/06/2021 21:41:02 - INFO - __main__ - Step 2973: {'lr': 0.0004999467887512928, 'samples': 570816, 'steps': 2972, 'loss/train': 2.324302911758423} +11/06/2021 21:41:03 - INFO - __main__ - Step 2974: {'lr': 0.0004999466792106998, 'samples': 571008, 'steps': 2973, 'loss/train': 2.198997974395752} +11/06/2021 21:41:03 - INFO - __main__ - Step 2975: {'lr': 0.0004999465695574848, 'samples': 571200, 'steps': 2974, 'loss/train': 2.4964334964752197} +11/06/2021 21:41:03 - INFO - __main__ - Step 2976: {'lr': 0.0004999464597916476, 'samples': 571392, 'steps': 2975, 'loss/train': 2.4963150024414062} +11/06/2021 21:41:04 - INFO - __main__ - Step 2977: {'lr': 0.0004999463499131884, 'samples': 571584, 'steps': 2976, 'loss/train': 2.5181667804718018} +11/06/2021 21:41:04 - INFO - __main__ - Step 2978: {'lr': 0.0004999462399221073, 'samples': 571776, 'steps': 2977, 'loss/train': 3.5236194133758545} +11/06/2021 21:41:05 - INFO - __main__ - Step 2979: {'lr': 0.0004999461298184042, 'samples': 571968, 'steps': 2978, 'loss/train': 2.367652416229248} +11/06/2021 21:41:06 - INFO - __main__ - Step 2980: {'lr': 0.0004999460196020793, 'samples': 572160, 'steps': 2979, 'loss/train': 2.657733201980591} +11/06/2021 21:41:06 - INFO - __main__ - Step 2981: {'lr': 0.0004999459092731326, 'samples': 572352, 'steps': 2980, 'loss/train': 2.142723321914673} +11/06/2021 21:41:06 - INFO - __main__ - Step 2982: {'lr': 0.000499945798831564, 'samples': 572544, 'steps': 2981, 'loss/train': 2.780032157897949} +11/06/2021 21:41:07 - INFO - __main__ - Step 2983: {'lr': 0.0004999456882773737, 'samples': 572736, 'steps': 2982, 'loss/train': 2.4689583778381348} +11/06/2021 21:41:08 - INFO - __main__ - Step 2984: {'lr': 0.0004999455776105618, 'samples': 572928, 'steps': 2983, 'loss/train': 1.9315149784088135} +11/06/2021 21:41:08 - INFO - __main__ - Step 2985: {'lr': 0.0004999454668311283, 'samples': 573120, 'steps': 2984, 'loss/train': 2.1817145347595215} +11/06/2021 21:41:08 - INFO - __main__ - Step 2986: {'lr': 0.0004999453559390731, 'samples': 573312, 'steps': 2985, 'loss/train': 2.152888774871826} +11/06/2021 21:41:09 - INFO - __main__ - Step 2987: {'lr': 0.0004999452449343967, 'samples': 573504, 'steps': 2986, 'loss/train': 2.3532779216766357} +11/06/2021 21:41:09 - INFO - __main__ - Step 2988: {'lr': 0.0004999451338170985, 'samples': 573696, 'steps': 2987, 'loss/train': 2.4001834392547607} +11/06/2021 21:41:10 - INFO - __main__ - Step 2989: {'lr': 0.000499945022587179, 'samples': 573888, 'steps': 2988, 'loss/train': 2.3787949085235596} +11/06/2021 21:41:10 - INFO - __main__ - Step 2990: {'lr': 0.0004999449112446381, 'samples': 574080, 'steps': 2989, 'loss/train': 2.610903263092041} +11/06/2021 21:41:11 - INFO - __main__ - Step 2991: {'lr': 0.000499944799789476, 'samples': 574272, 'steps': 2990, 'loss/train': 2.203000545501709} +11/06/2021 21:41:11 - INFO - __main__ - Step 2992: {'lr': 0.0004999446882216925, 'samples': 574464, 'steps': 2991, 'loss/train': 1.9404032230377197} +11/06/2021 21:41:11 - INFO - __main__ - Step 2993: {'lr': 0.0004999445765412878, 'samples': 574656, 'steps': 2992, 'loss/train': 2.0062878131866455} +11/06/2021 21:41:12 - INFO - __main__ - Step 2994: {'lr': 0.0004999444647482619, 'samples': 574848, 'steps': 2993, 'loss/train': 2.512753963470459} +11/06/2021 21:41:13 - INFO - __main__ - Step 2995: {'lr': 0.0004999443528426149, 'samples': 575040, 'steps': 2994, 'loss/train': 2.4999752044677734} +11/06/2021 21:41:13 - INFO - __main__ - Step 2996: {'lr': 0.0004999442408243469, 'samples': 575232, 'steps': 2995, 'loss/train': 2.140004873275757} +11/06/2021 21:41:13 - INFO - __main__ - Step 2997: {'lr': 0.0004999441286934578, 'samples': 575424, 'steps': 2996, 'loss/train': 2.258283853530884} +11/06/2021 21:41:14 - INFO - __main__ - Step 2998: {'lr': 0.0004999440164499478, 'samples': 575616, 'steps': 2997, 'loss/train': 2.103290557861328} +11/06/2021 21:41:14 - INFO - __main__ - Step 2999: {'lr': 0.0004999439040938168, 'samples': 575808, 'steps': 2998, 'loss/train': 2.217271327972412} +11/06/2021 21:41:15 - INFO - __main__ - Step 3000: {'lr': 0.000499943791625065, 'samples': 576000, 'steps': 2999, 'loss/train': 2.1993706226348877} +11/06/2021 21:41:15 - INFO - __main__ - Step 3001: {'lr': 0.0004999436790436923, 'samples': 576192, 'steps': 3000, 'loss/train': 1.9046951532363892} +11/06/2021 21:41:16 - INFO - __main__ - Step 3002: {'lr': 0.000499943566349699, 'samples': 576384, 'steps': 3001, 'loss/train': 2.5663747787475586} +11/06/2021 21:41:16 - INFO - __main__ - Step 3003: {'lr': 0.0004999434535430848, 'samples': 576576, 'steps': 3002, 'loss/train': 2.3395111560821533} +11/06/2021 21:41:17 - INFO - __main__ - Step 3004: {'lr': 0.0004999433406238501, 'samples': 576768, 'steps': 3003, 'loss/train': 2.3144681453704834} +11/06/2021 21:41:18 - INFO - __main__ - Step 3005: {'lr': 0.0004999432275919947, 'samples': 576960, 'steps': 3004, 'loss/train': 2.3449320793151855} +11/06/2021 21:41:18 - INFO - __main__ - Step 3006: {'lr': 0.0004999431144475187, 'samples': 577152, 'steps': 3005, 'loss/train': 2.1510040760040283} +11/06/2021 21:41:18 - INFO - __main__ - Step 3007: {'lr': 0.0004999430011904222, 'samples': 577344, 'steps': 3006, 'loss/train': 0.7324512004852295} +11/06/2021 21:41:19 - INFO - __main__ - Step 3008: {'lr': 0.0004999428878207054, 'samples': 577536, 'steps': 3007, 'loss/train': 2.3040289878845215} +11/06/2021 21:41:19 - INFO - __main__ - Step 3009: {'lr': 0.000499942774338368, 'samples': 577728, 'steps': 3008, 'loss/train': 2.3875339031219482} +11/06/2021 21:41:20 - INFO - __main__ - Step 3010: {'lr': 0.0004999426607434104, 'samples': 577920, 'steps': 3009, 'loss/train': 2.562206268310547} +11/06/2021 21:41:20 - INFO - __main__ - Step 3011: {'lr': 0.0004999425470358324, 'samples': 578112, 'steps': 3010, 'loss/train': 2.1042847633361816} +11/06/2021 21:41:21 - INFO - __main__ - Step 3012: {'lr': 0.0004999424332156341, 'samples': 578304, 'steps': 3011, 'loss/train': 1.8335940837860107} +11/06/2021 21:41:21 - INFO - __main__ - Step 3013: {'lr': 0.0004999423192828156, 'samples': 578496, 'steps': 3012, 'loss/train': 2.3943774700164795} +11/06/2021 21:41:21 - INFO - __main__ - Step 3014: {'lr': 0.0004999422052373771, 'samples': 578688, 'steps': 3013, 'loss/train': 2.3687760829925537} +11/06/2021 21:41:23 - INFO - __main__ - Step 3015: {'lr': 0.0004999420910793183, 'samples': 578880, 'steps': 3014, 'loss/train': 2.2933881282806396} +11/06/2021 21:41:23 - INFO - __main__ - Step 3016: {'lr': 0.0004999419768086397, 'samples': 579072, 'steps': 3015, 'loss/train': 2.4723987579345703} +11/06/2021 21:41:23 - INFO - __main__ - Step 3017: {'lr': 0.0004999418624253408, 'samples': 579264, 'steps': 3016, 'loss/train': 2.3024117946624756} +11/06/2021 21:41:24 - INFO - __main__ - Step 3018: {'lr': 0.0004999417479294221, 'samples': 579456, 'steps': 3017, 'loss/train': 2.373169183731079} +11/06/2021 21:41:24 - INFO - __main__ - Step 3019: {'lr': 0.0004999416333208835, 'samples': 579648, 'steps': 3018, 'loss/train': 1.6759024858474731} +11/06/2021 21:41:25 - INFO - __main__ - Step 3020: {'lr': 0.0004999415185997252, 'samples': 579840, 'steps': 3019, 'loss/train': 2.323343515396118} +11/06/2021 21:41:25 - INFO - __main__ - Step 3021: {'lr': 0.0004999414037659468, 'samples': 580032, 'steps': 3020, 'loss/train': 1.5138059854507446} +11/06/2021 21:41:26 - INFO - __main__ - Step 3022: {'lr': 0.000499941288819549, 'samples': 580224, 'steps': 3021, 'loss/train': 1.5361846685409546} +11/06/2021 21:41:26 - INFO - __main__ - Step 3023: {'lr': 0.0004999411737605313, 'samples': 580416, 'steps': 3022, 'loss/train': 1.946350336074829} +11/06/2021 21:41:27 - INFO - __main__ - Step 3024: {'lr': 0.000499941058588894, 'samples': 580608, 'steps': 3023, 'loss/train': 2.60408091545105} +11/06/2021 21:41:28 - INFO - __main__ - Step 3025: {'lr': 0.0004999409433046371, 'samples': 580800, 'steps': 3024, 'loss/train': 2.4534120559692383} +11/06/2021 21:41:28 - INFO - __main__ - Step 3026: {'lr': 0.0004999408279077607, 'samples': 580992, 'steps': 3025, 'loss/train': 2.68884015083313} +11/06/2021 21:41:29 - INFO - __main__ - Step 3027: {'lr': 0.0004999407123982649, 'samples': 581184, 'steps': 3026, 'loss/train': 2.0190529823303223} +11/06/2021 21:41:29 - INFO - __main__ - Step 3028: {'lr': 0.0004999405967761495, 'samples': 581376, 'steps': 3027, 'loss/train': 1.0339617729187012} +11/06/2021 21:41:29 - INFO - __main__ - Step 3029: {'lr': 0.0004999404810414149, 'samples': 581568, 'steps': 3028, 'loss/train': 0.895268440246582} +11/06/2021 21:41:31 - INFO - __main__ - Step 3030: {'lr': 0.0004999403651940608, 'samples': 581760, 'steps': 3029, 'loss/train': 2.5212795734405518} +11/06/2021 21:41:31 - INFO - __main__ - Step 3031: {'lr': 0.0004999402492340875, 'samples': 581952, 'steps': 3030, 'loss/train': 2.4372713565826416} +11/06/2021 21:41:31 - INFO - __main__ - Step 3032: {'lr': 0.000499940133161495, 'samples': 582144, 'steps': 3031, 'loss/train': 2.357042074203491} +11/06/2021 21:41:32 - INFO - __main__ - Step 3033: {'lr': 0.0004999400169762834, 'samples': 582336, 'steps': 3032, 'loss/train': 1.6500097513198853} +11/06/2021 21:41:32 - INFO - __main__ - Step 3034: {'lr': 0.0004999399006784525, 'samples': 582528, 'steps': 3033, 'loss/train': 2.2816481590270996} +11/06/2021 21:41:33 - INFO - __main__ - Step 3035: {'lr': 0.0004999397842680027, 'samples': 582720, 'steps': 3034, 'loss/train': 2.364650249481201} +11/06/2021 21:41:33 - INFO - __main__ - Step 3036: {'lr': 0.0004999396677449338, 'samples': 582912, 'steps': 3035, 'loss/train': 0.6538060307502747} +11/06/2021 21:41:34 - INFO - __main__ - Step 3037: {'lr': 0.000499939551109246, 'samples': 583104, 'steps': 3036, 'loss/train': 2.646855354309082} +11/06/2021 21:41:34 - INFO - __main__ - Step 3038: {'lr': 0.0004999394343609393, 'samples': 583296, 'steps': 3037, 'loss/train': 2.262348175048828} +11/06/2021 21:41:34 - INFO - __main__ - Step 3039: {'lr': 0.0004999393175000137, 'samples': 583488, 'steps': 3038, 'loss/train': 2.1946680545806885} +11/06/2021 21:41:35 - INFO - __main__ - Step 3040: {'lr': 0.0004999392005264694, 'samples': 583680, 'steps': 3039, 'loss/train': 2.3588778972625732} +11/06/2021 21:41:36 - INFO - __main__ - Step 3041: {'lr': 0.0004999390834403062, 'samples': 583872, 'steps': 3040, 'loss/train': 1.918365716934204} +11/06/2021 21:41:36 - INFO - __main__ - Step 3042: {'lr': 0.0004999389662415244, 'samples': 584064, 'steps': 3041, 'loss/train': 2.238910436630249} +11/06/2021 21:41:37 - INFO - __main__ - Step 3043: {'lr': 0.000499938848930124, 'samples': 584256, 'steps': 3042, 'loss/train': 1.9267772436141968} +11/06/2021 21:41:37 - INFO - __main__ - Step 3044: {'lr': 0.0004999387315061049, 'samples': 584448, 'steps': 3043, 'loss/train': 2.763803005218506} +11/06/2021 21:41:37 - INFO - __main__ - Step 3045: {'lr': 0.0004999386139694673, 'samples': 584640, 'steps': 3044, 'loss/train': 5.723489761352539} +11/06/2021 21:41:38 - INFO - __main__ - Step 3046: {'lr': 0.0004999384963202113, 'samples': 584832, 'steps': 3045, 'loss/train': 2.657350778579712} +11/06/2021 21:41:39 - INFO - __main__ - Step 3047: {'lr': 0.0004999383785583368, 'samples': 585024, 'steps': 3046, 'loss/train': 2.1708598136901855} +11/06/2021 21:41:39 - INFO - __main__ - Step 3048: {'lr': 0.0004999382606838439, 'samples': 585216, 'steps': 3047, 'loss/train': 2.4225125312805176} +11/06/2021 21:41:39 - INFO - __main__ - Step 3049: {'lr': 0.0004999381426967327, 'samples': 585408, 'steps': 3048, 'loss/train': 2.1795241832733154} +11/06/2021 21:41:40 - INFO - __main__ - Step 3050: {'lr': 0.0004999380245970033, 'samples': 585600, 'steps': 3049, 'loss/train': 2.3345532417297363} +11/06/2021 21:41:40 - INFO - __main__ - Step 3051: {'lr': 0.0004999379063846555, 'samples': 585792, 'steps': 3050, 'loss/train': 2.1658904552459717} +11/06/2021 21:41:41 - INFO - __main__ - Step 3052: {'lr': 0.0004999377880596897, 'samples': 585984, 'steps': 3051, 'loss/train': 2.3104407787323} +11/06/2021 21:41:41 - INFO - __main__ - Step 3053: {'lr': 0.0004999376696221057, 'samples': 586176, 'steps': 3052, 'loss/train': 2.1022863388061523} +11/06/2021 21:41:42 - INFO - __main__ - Step 3054: {'lr': 0.0004999375510719037, 'samples': 586368, 'steps': 3053, 'loss/train': 2.1373109817504883} +11/06/2021 21:41:42 - INFO - __main__ - Step 3055: {'lr': 0.0004999374324090837, 'samples': 586560, 'steps': 3054, 'loss/train': 2.6458959579467773} +11/06/2021 21:41:43 - INFO - __main__ - Step 3056: {'lr': 0.0004999373136336457, 'samples': 586752, 'steps': 3055, 'loss/train': 2.1818501949310303} +11/06/2021 21:41:44 - INFO - __main__ - Step 3057: {'lr': 0.0004999371947455899, 'samples': 586944, 'steps': 3056, 'loss/train': 3.2870852947235107} +11/06/2021 21:41:44 - INFO - __main__ - Step 3058: {'lr': 0.0004999370757449162, 'samples': 587136, 'steps': 3057, 'loss/train': 1.6503088474273682} +11/06/2021 21:41:45 - INFO - __main__ - Step 3059: {'lr': 0.0004999369566316247, 'samples': 587328, 'steps': 3058, 'loss/train': 3.2985236644744873} +11/06/2021 21:41:45 - INFO - __main__ - Step 3060: {'lr': 0.0004999368374057155, 'samples': 587520, 'steps': 3059, 'loss/train': 2.637629985809326} +11/06/2021 21:41:45 - INFO - __main__ - Step 3061: {'lr': 0.0004999367180671886, 'samples': 587712, 'steps': 3060, 'loss/train': 2.058300733566284} +11/06/2021 21:41:46 - INFO - __main__ - Step 3062: {'lr': 0.000499936598616044, 'samples': 587904, 'steps': 3061, 'loss/train': 2.2234086990356445} +11/06/2021 21:41:46 - INFO - __main__ - Step 3063: {'lr': 0.0004999364790522819, 'samples': 588096, 'steps': 3062, 'loss/train': 1.9552711248397827} +11/06/2021 21:41:47 - INFO - __main__ - Step 3064: {'lr': 0.0004999363593759022, 'samples': 588288, 'steps': 3063, 'loss/train': 2.5826447010040283} +11/06/2021 21:41:47 - INFO - __main__ - Step 3065: {'lr': 0.0004999362395869052, 'samples': 588480, 'steps': 3064, 'loss/train': 2.5143256187438965} +11/06/2021 21:41:48 - INFO - __main__ - Step 3066: {'lr': 0.0004999361196852906, 'samples': 588672, 'steps': 3065, 'loss/train': 2.092707633972168} +11/06/2021 21:41:48 - INFO - __main__ - Step 3067: {'lr': 0.0004999359996710588, 'samples': 588864, 'steps': 3066, 'loss/train': 2.1652286052703857} +11/06/2021 21:41:49 - INFO - __main__ - Step 3068: {'lr': 0.0004999358795442096, 'samples': 589056, 'steps': 3067, 'loss/train': 2.3341615200042725} +11/06/2021 21:41:50 - INFO - __main__ - Step 3069: {'lr': 0.0004999357593047431, 'samples': 589248, 'steps': 3068, 'loss/train': 1.7487068176269531} +11/06/2021 21:41:50 - INFO - __main__ - Step 3070: {'lr': 0.0004999356389526595, 'samples': 589440, 'steps': 3069, 'loss/train': 2.2745633125305176} +11/06/2021 21:41:50 - INFO - __main__ - Step 3071: {'lr': 0.0004999355184879587, 'samples': 589632, 'steps': 3070, 'loss/train': 1.911078691482544} +11/06/2021 21:41:51 - INFO - __main__ - Step 3072: {'lr': 0.0004999353979106409, 'samples': 589824, 'steps': 3071, 'loss/train': 2.032170057296753} +11/06/2021 21:41:52 - INFO - __main__ - Step 3073: {'lr': 0.000499935277220706, 'samples': 590016, 'steps': 3072, 'loss/train': 0.5505169034004211} +11/06/2021 21:41:52 - INFO - __main__ - Step 3074: {'lr': 0.0004999351564181541, 'samples': 590208, 'steps': 3073, 'loss/train': 2.0557284355163574} +11/06/2021 21:41:53 - INFO - __main__ - Step 3075: {'lr': 0.0004999350355029854, 'samples': 590400, 'steps': 3074, 'loss/train': 2.871734857559204} +11/06/2021 21:41:53 - INFO - __main__ - Step 3076: {'lr': 0.0004999349144751997, 'samples': 590592, 'steps': 3075, 'loss/train': 2.093614339828491} +11/06/2021 21:41:53 - INFO - __main__ - Step 3077: {'lr': 0.0004999347933347972, 'samples': 590784, 'steps': 3076, 'loss/train': 2.2639260292053223} +11/06/2021 21:41:55 - INFO - __main__ - Step 3078: {'lr': 0.0004999346720817779, 'samples': 590976, 'steps': 3077, 'loss/train': 1.5730407238006592} +11/06/2021 21:41:55 - INFO - __main__ - Step 3079: {'lr': 0.000499934550716142, 'samples': 591168, 'steps': 3078, 'loss/train': 2.4267160892486572} +11/06/2021 21:41:55 - INFO - __main__ - Step 3080: {'lr': 0.0004999344292378893, 'samples': 591360, 'steps': 3079, 'loss/train': 3.6418893337249756} +11/06/2021 21:41:56 - INFO - __main__ - Step 3081: {'lr': 0.0004999343076470202, 'samples': 591552, 'steps': 3080, 'loss/train': 1.6918516159057617} +11/06/2021 21:41:56 - INFO - __main__ - Step 3082: {'lr': 0.0004999341859435345, 'samples': 591744, 'steps': 3081, 'loss/train': 2.610215902328491} +11/06/2021 21:41:57 - INFO - __main__ - Step 3083: {'lr': 0.0004999340641274322, 'samples': 591936, 'steps': 3082, 'loss/train': 2.330768346786499} +11/06/2021 21:41:57 - INFO - __main__ - Step 3084: {'lr': 0.0004999339421987136, 'samples': 592128, 'steps': 3083, 'loss/train': 1.9727678298950195} +11/06/2021 21:41:58 - INFO - __main__ - Step 3085: {'lr': 0.0004999338201573786, 'samples': 592320, 'steps': 3084, 'loss/train': 2.6285154819488525} +11/06/2021 21:41:58 - INFO - __main__ - Step 3086: {'lr': 0.0004999336980034271, 'samples': 592512, 'steps': 3085, 'loss/train': 2.5483882427215576} +11/06/2021 21:41:59 - INFO - __main__ - Step 3087: {'lr': 0.0004999335757368595, 'samples': 592704, 'steps': 3086, 'loss/train': 2.4830641746520996} +11/06/2021 21:41:59 - INFO - __main__ - Step 3088: {'lr': 0.0004999334533576757, 'samples': 592896, 'steps': 3087, 'loss/train': 2.06929087638855} +11/06/2021 21:41:59 - INFO - __main__ - Step 3089: {'lr': 0.0004999333308658756, 'samples': 593088, 'steps': 3088, 'loss/train': 2.439222812652588} +11/06/2021 21:42:01 - INFO - __main__ - Step 3090: {'lr': 0.0004999332082614597, 'samples': 593280, 'steps': 3089, 'loss/train': 1.6735726594924927} +11/06/2021 21:42:01 - INFO - __main__ - Step 3091: {'lr': 0.0004999330855444274, 'samples': 593472, 'steps': 3090, 'loss/train': 2.4830446243286133} +11/06/2021 21:42:01 - INFO - __main__ - Step 3092: {'lr': 0.0004999329627147792, 'samples': 593664, 'steps': 3091, 'loss/train': 1.9454426765441895} +11/06/2021 21:42:02 - INFO - __main__ - Step 3093: {'lr': 0.0004999328397725152, 'samples': 593856, 'steps': 3092, 'loss/train': 2.445350408554077} +11/06/2021 21:42:02 - INFO - __main__ - Step 3094: {'lr': 0.0004999327167176352, 'samples': 594048, 'steps': 3093, 'loss/train': 2.219423532485962} +11/06/2021 21:42:02 - INFO - __main__ - Step 3095: {'lr': 0.0004999325935501395, 'samples': 594240, 'steps': 3094, 'loss/train': 2.2615649700164795} +11/06/2021 21:42:03 - INFO - __main__ - Step 3096: {'lr': 0.0004999324702700279, 'samples': 594432, 'steps': 3095, 'loss/train': 2.060243844985962} +11/06/2021 21:42:04 - INFO - __main__ - Step 3097: {'lr': 0.0004999323468773007, 'samples': 594624, 'steps': 3096, 'loss/train': 1.7364767789840698} +11/06/2021 21:42:04 - INFO - __main__ - Step 3098: {'lr': 0.0004999322233719578, 'samples': 594816, 'steps': 3097, 'loss/train': 2.3466086387634277} +11/06/2021 21:42:04 - INFO - __main__ - Step 3099: {'lr': 0.0004999320997539992, 'samples': 595008, 'steps': 3098, 'loss/train': 2.1478734016418457} +11/06/2021 21:42:05 - INFO - __main__ - Step 3100: {'lr': 0.0004999319760234251, 'samples': 595200, 'steps': 3099, 'loss/train': 1.8214367628097534} +11/06/2021 21:42:06 - INFO - __main__ - Step 3101: {'lr': 0.0004999318521802356, 'samples': 595392, 'steps': 3100, 'loss/train': 2.0618221759796143} +11/06/2021 21:42:06 - INFO - __main__ - Step 3102: {'lr': 0.0004999317282244305, 'samples': 595584, 'steps': 3101, 'loss/train': 2.218130350112915} +11/06/2021 21:42:07 - INFO - __main__ - Step 3103: {'lr': 0.0004999316041560102, 'samples': 595776, 'steps': 3102, 'loss/train': 1.9381036758422852} +11/06/2021 21:42:07 - INFO - __main__ - Step 3104: {'lr': 0.0004999314799749745, 'samples': 595968, 'steps': 3103, 'loss/train': 3.2617650032043457} +11/06/2021 21:42:07 - INFO - __main__ - Step 3105: {'lr': 0.0004999313556813235, 'samples': 596160, 'steps': 3104, 'loss/train': 2.255150079727173} +11/06/2021 21:42:08 - INFO - __main__ - Step 3106: {'lr': 0.0004999312312750573, 'samples': 596352, 'steps': 3105, 'loss/train': 1.6376298666000366} +11/06/2021 21:42:09 - INFO - __main__ - Step 3107: {'lr': 0.000499931106756176, 'samples': 596544, 'steps': 3106, 'loss/train': 2.3858001232147217} +11/06/2021 21:42:09 - INFO - __main__ - Step 3108: {'lr': 0.0004999309821246795, 'samples': 596736, 'steps': 3107, 'loss/train': 2.6677393913269043} +11/06/2021 21:42:10 - INFO - __main__ - Step 3109: {'lr': 0.000499930857380568, 'samples': 596928, 'steps': 3108, 'loss/train': 1.4987972974777222} +11/06/2021 21:42:10 - INFO - __main__ - Step 3110: {'lr': 0.0004999307325238416, 'samples': 597120, 'steps': 3109, 'loss/train': 1.9903048276901245} +11/06/2021 21:42:10 - INFO - __main__ - Step 3111: {'lr': 0.0004999306075545002, 'samples': 597312, 'steps': 3110, 'loss/train': 2.7295010089874268} +11/06/2021 21:42:11 - INFO - __main__ - Step 3112: {'lr': 0.0004999304824725439, 'samples': 597504, 'steps': 3111, 'loss/train': 2.1662516593933105} +11/06/2021 21:42:12 - INFO - __main__ - Step 3113: {'lr': 0.0004999303572779727, 'samples': 597696, 'steps': 3112, 'loss/train': 1.8486442565917969} +11/06/2021 21:42:12 - INFO - __main__ - Step 3114: {'lr': 0.0004999302319707869, 'samples': 597888, 'steps': 3113, 'loss/train': 2.575617551803589} +11/06/2021 21:42:12 - INFO - __main__ - Step 3115: {'lr': 0.0004999301065509863, 'samples': 598080, 'steps': 3114, 'loss/train': 2.4557383060455322} +11/06/2021 21:42:13 - INFO - __main__ - Step 3116: {'lr': 0.0004999299810185712, 'samples': 598272, 'steps': 3115, 'loss/train': 1.887520670890808} +11/06/2021 21:42:14 - INFO - __main__ - Step 3117: {'lr': 0.0004999298553735413, 'samples': 598464, 'steps': 3116, 'loss/train': 2.2960591316223145} +11/06/2021 21:42:14 - INFO - __main__ - Step 3118: {'lr': 0.000499929729615897, 'samples': 598656, 'steps': 3117, 'loss/train': 2.5776569843292236} +11/06/2021 21:42:14 - INFO - __main__ - Step 3119: {'lr': 0.0004999296037456381, 'samples': 598848, 'steps': 3118, 'loss/train': 2.3189525604248047} +11/06/2021 21:42:15 - INFO - __main__ - Step 3120: {'lr': 0.0004999294777627649, 'samples': 599040, 'steps': 3119, 'loss/train': 1.3478337526321411} +11/06/2021 21:42:15 - INFO - __main__ - Step 3121: {'lr': 0.0004999293516672773, 'samples': 599232, 'steps': 3120, 'loss/train': 2.864377021789551} +11/06/2021 21:42:16 - INFO - __main__ - Step 3122: {'lr': 0.0004999292254591754, 'samples': 599424, 'steps': 3121, 'loss/train': 2.7079334259033203} +11/06/2021 21:42:16 - INFO - __main__ - Step 3123: {'lr': 0.0004999290991384591, 'samples': 599616, 'steps': 3122, 'loss/train': 2.133533477783203} +11/06/2021 21:42:17 - INFO - __main__ - Step 3124: {'lr': 0.0004999289727051289, 'samples': 599808, 'steps': 3123, 'loss/train': 2.1969847679138184} +11/06/2021 21:42:17 - INFO - __main__ - Step 3125: {'lr': 0.0004999288461591842, 'samples': 600000, 'steps': 3124, 'loss/train': 1.7113127708435059} +11/06/2021 21:42:17 - INFO - __main__ - Step 3126: {'lr': 0.0004999287195006257, 'samples': 600192, 'steps': 3125, 'loss/train': 2.617366313934326} +11/06/2021 21:42:19 - INFO - __main__ - Step 3127: {'lr': 0.000499928592729453, 'samples': 600384, 'steps': 3126, 'loss/train': 2.459381103515625} +11/06/2021 21:42:19 - INFO - __main__ - Step 3128: {'lr': 0.0004999284658456665, 'samples': 600576, 'steps': 3127, 'loss/train': 2.3718807697296143} +11/06/2021 21:42:19 - INFO - __main__ - Step 3129: {'lr': 0.000499928338849266, 'samples': 600768, 'steps': 3128, 'loss/train': 2.543180465698242} +11/06/2021 21:42:20 - INFO - __main__ - Step 3130: {'lr': 0.0004999282117402516, 'samples': 600960, 'steps': 3129, 'loss/train': 1.7423886060714722} +11/06/2021 21:42:20 - INFO - __main__ - Step 3131: {'lr': 0.0004999280845186235, 'samples': 601152, 'steps': 3130, 'loss/train': 2.2052173614501953} +11/06/2021 21:42:21 - INFO - __main__ - Step 3132: {'lr': 0.0004999279571843816, 'samples': 601344, 'steps': 3131, 'loss/train': 1.9484204053878784} +11/06/2021 21:42:22 - INFO - __main__ - Step 3133: {'lr': 0.000499927829737526, 'samples': 601536, 'steps': 3132, 'loss/train': 2.428269147872925} +11/06/2021 21:42:22 - INFO - __main__ - Step 3134: {'lr': 0.0004999277021780569, 'samples': 601728, 'steps': 3133, 'loss/train': 2.089491128921509} +11/06/2021 21:42:22 - INFO - __main__ - Step 3135: {'lr': 0.0004999275745059741, 'samples': 601920, 'steps': 3134, 'loss/train': 2.9237546920776367} +11/06/2021 21:42:23 - INFO - __main__ - Step 3136: {'lr': 0.0004999274467212779, 'samples': 602112, 'steps': 3135, 'loss/train': 2.297293186187744} +11/06/2021 21:42:23 - INFO - __main__ - Step 3137: {'lr': 0.0004999273188239681, 'samples': 602304, 'steps': 3136, 'loss/train': 2.1000170707702637} +11/06/2021 21:42:24 - INFO - __main__ - Step 3138: {'lr': 0.0004999271908140451, 'samples': 602496, 'steps': 3137, 'loss/train': 2.391845703125} +11/06/2021 21:42:24 - INFO - __main__ - Step 3139: {'lr': 0.0004999270626915086, 'samples': 602688, 'steps': 3138, 'loss/train': 2.167910099029541} +11/06/2021 21:42:25 - INFO - __main__ - Step 3140: {'lr': 0.0004999269344563589, 'samples': 602880, 'steps': 3139, 'loss/train': 2.10351300239563} +11/06/2021 21:42:25 - INFO - __main__ - Step 3141: {'lr': 0.0004999268061085959, 'samples': 603072, 'steps': 3140, 'loss/train': 2.418550968170166} +11/06/2021 21:42:25 - INFO - __main__ - Step 3142: {'lr': 0.0004999266776482199, 'samples': 603264, 'steps': 3141, 'loss/train': 2.0939297676086426} +11/06/2021 21:42:27 - INFO - __main__ - Step 3143: {'lr': 0.0004999265490752306, 'samples': 603456, 'steps': 3142, 'loss/train': 2.4321014881134033} +11/06/2021 21:42:27 - INFO - __main__ - Step 3144: {'lr': 0.0004999264203896284, 'samples': 603648, 'steps': 3143, 'loss/train': 2.1129066944122314} +11/06/2021 21:42:27 - INFO - __main__ - Step 3145: {'lr': 0.0004999262915914132, 'samples': 603840, 'steps': 3144, 'loss/train': 1.9223228693008423} +11/06/2021 21:42:28 - INFO - __main__ - Step 3146: {'lr': 0.000499926162680585, 'samples': 604032, 'steps': 3145, 'loss/train': 1.9708632230758667} +11/06/2021 21:42:28 - INFO - __main__ - Step 3147: {'lr': 0.000499926033657144, 'samples': 604224, 'steps': 3146, 'loss/train': 2.535964250564575} +11/06/2021 21:42:29 - INFO - __main__ - Step 3148: {'lr': 0.0004999259045210901, 'samples': 604416, 'steps': 3147, 'loss/train': 1.4385805130004883} +11/06/2021 21:42:29 - INFO - __main__ - Step 3149: {'lr': 0.0004999257752724234, 'samples': 604608, 'steps': 3148, 'loss/train': 2.0960731506347656} +11/06/2021 21:42:30 - INFO - __main__ - Step 3150: {'lr': 0.0004999256459111443, 'samples': 604800, 'steps': 3149, 'loss/train': 1.577193021774292} +11/06/2021 21:42:30 - INFO - __main__ - Step 3151: {'lr': 0.0004999255164372523, 'samples': 604992, 'steps': 3150, 'loss/train': 1.8809454441070557} +11/06/2021 21:42:30 - INFO - __main__ - Step 3152: {'lr': 0.0004999253868507476, 'samples': 605184, 'steps': 3151, 'loss/train': 2.5812270641326904} +11/06/2021 21:42:31 - INFO - __main__ - Step 3153: {'lr': 0.0004999252571516306, 'samples': 605376, 'steps': 3152, 'loss/train': 2.324453353881836} +11/06/2021 21:42:32 - INFO - __main__ - Step 3154: {'lr': 0.0004999251273399011, 'samples': 605568, 'steps': 3153, 'loss/train': 1.5840191841125488} +11/06/2021 21:42:32 - INFO - __main__ - Step 3155: {'lr': 0.0004999249974155592, 'samples': 605760, 'steps': 3154, 'loss/train': 2.419705390930176} +11/06/2021 21:42:33 - INFO - __main__ - Step 3156: {'lr': 0.0004999248673786049, 'samples': 605952, 'steps': 3155, 'loss/train': 1.7660547494888306} +11/06/2021 21:42:33 - INFO - __main__ - Step 3157: {'lr': 0.0004999247372290383, 'samples': 606144, 'steps': 3156, 'loss/train': 3.5126683712005615} +11/06/2021 21:42:33 - INFO - __main__ - Step 3158: {'lr': 0.0004999246069668596, 'samples': 606336, 'steps': 3157, 'loss/train': 2.0734901428222656} +11/06/2021 21:42:34 - INFO - __main__ - Step 3159: {'lr': 0.0004999244765920687, 'samples': 606528, 'steps': 3158, 'loss/train': 2.5572397708892822} +11/06/2021 21:42:35 - INFO - __main__ - Step 3160: {'lr': 0.0004999243461046656, 'samples': 606720, 'steps': 3159, 'loss/train': 1.9452892541885376} +11/06/2021 21:42:35 - INFO - __main__ - Step 3161: {'lr': 0.0004999242155046504, 'samples': 606912, 'steps': 3160, 'loss/train': 0.912672221660614} +11/06/2021 21:42:35 - INFO - __main__ - Step 3162: {'lr': 0.0004999240847920233, 'samples': 607104, 'steps': 3161, 'loss/train': 1.7738767862319946} +11/06/2021 21:42:36 - INFO - __main__ - Step 3163: {'lr': 0.0004999239539667842, 'samples': 607296, 'steps': 3162, 'loss/train': 1.6333916187286377} +11/06/2021 21:42:37 - INFO - __main__ - Step 3164: {'lr': 0.0004999238230289333, 'samples': 607488, 'steps': 3163, 'loss/train': 2.6016409397125244} +11/06/2021 21:42:37 - INFO - __main__ - Step 3165: {'lr': 0.0004999236919784705, 'samples': 607680, 'steps': 3164, 'loss/train': 2.146538734436035} +11/06/2021 21:42:37 - INFO - __main__ - Step 3166: {'lr': 0.0004999235608153961, 'samples': 607872, 'steps': 3165, 'loss/train': 1.9972015619277954} +11/06/2021 21:42:38 - INFO - __main__ - Step 3167: {'lr': 0.0004999234295397098, 'samples': 608064, 'steps': 3166, 'loss/train': 2.117999315261841} +11/06/2021 21:42:38 - INFO - __main__ - Step 3168: {'lr': 0.000499923298151412, 'samples': 608256, 'steps': 3167, 'loss/train': 2.080382823944092} +11/06/2021 21:42:39 - INFO - __main__ - Step 3169: {'lr': 0.0004999231666505025, 'samples': 608448, 'steps': 3168, 'loss/train': 2.333287239074707} +11/06/2021 21:42:39 - INFO - __main__ - Step 3170: {'lr': 0.0004999230350369816, 'samples': 608640, 'steps': 3169, 'loss/train': 2.8902382850646973} +11/06/2021 21:42:40 - INFO - __main__ - Step 3171: {'lr': 0.0004999229033108492, 'samples': 608832, 'steps': 3170, 'loss/train': 1.6683903932571411} +11/06/2021 21:42:40 - INFO - __main__ - Step 3172: {'lr': 0.0004999227714721054, 'samples': 609024, 'steps': 3171, 'loss/train': 1.9496757984161377} +11/06/2021 21:42:40 - INFO - __main__ - Step 3173: {'lr': 0.0004999226395207501, 'samples': 609216, 'steps': 3172, 'loss/train': 2.0327744483947754} +11/06/2021 21:42:41 - INFO - __main__ - Step 3174: {'lr': 0.0004999225074567837, 'samples': 609408, 'steps': 3173, 'loss/train': 2.1947336196899414} +11/06/2021 21:42:42 - INFO - __main__ - Step 3175: {'lr': 0.000499922375280206, 'samples': 609600, 'steps': 3174, 'loss/train': 2.3255155086517334} +11/06/2021 21:42:42 - INFO - __main__ - Step 3176: {'lr': 0.0004999222429910171, 'samples': 609792, 'steps': 3175, 'loss/train': 2.275817394256592} +11/06/2021 21:42:42 - INFO - __main__ - Step 3177: {'lr': 0.0004999221105892172, 'samples': 609984, 'steps': 3176, 'loss/train': 2.14980411529541} +11/06/2021 21:42:43 - INFO - __main__ - Step 3178: {'lr': 0.0004999219780748062, 'samples': 610176, 'steps': 3177, 'loss/train': 3.107052803039551} +11/06/2021 21:42:44 - INFO - __main__ - Step 3179: {'lr': 0.0004999218454477843, 'samples': 610368, 'steps': 3178, 'loss/train': 1.9000006914138794} +11/06/2021 21:42:44 - INFO - __main__ - Step 3180: {'lr': 0.0004999217127081514, 'samples': 610560, 'steps': 3179, 'loss/train': 2.2246599197387695} +11/06/2021 21:42:44 - INFO - __main__ - Step 3181: {'lr': 0.0004999215798559076, 'samples': 610752, 'steps': 3180, 'loss/train': 2.3011488914489746} +11/06/2021 21:42:45 - INFO - __main__ - Step 3182: {'lr': 0.000499921446891053, 'samples': 610944, 'steps': 3181, 'loss/train': 2.965468168258667} +11/06/2021 21:42:45 - INFO - __main__ - Step 3183: {'lr': 0.0004999213138135877, 'samples': 611136, 'steps': 3182, 'loss/train': 2.451305389404297} +11/06/2021 21:42:46 - INFO - __main__ - Step 3184: {'lr': 0.0004999211806235117, 'samples': 611328, 'steps': 3183, 'loss/train': 2.616995334625244} +11/06/2021 21:42:47 - INFO - __main__ - Step 3185: {'lr': 0.000499921047320825, 'samples': 611520, 'steps': 3184, 'loss/train': 1.994917869567871} +11/06/2021 21:42:47 - INFO - __main__ - Step 3186: {'lr': 0.0004999209139055278, 'samples': 611712, 'steps': 3185, 'loss/train': 2.5971717834472656} +11/06/2021 21:42:47 - INFO - __main__ - Step 3187: {'lr': 0.0004999207803776201, 'samples': 611904, 'steps': 3186, 'loss/train': 2.031585693359375} +11/06/2021 21:42:48 - INFO - __main__ - Step 3188: {'lr': 0.000499920646737102, 'samples': 612096, 'steps': 3187, 'loss/train': 2.4705827236175537} +11/06/2021 21:42:48 - INFO - __main__ - Step 3189: {'lr': 0.0004999205129839734, 'samples': 612288, 'steps': 3188, 'loss/train': 2.301380157470703} +11/06/2021 21:42:49 - INFO - __main__ - Step 3190: {'lr': 0.0004999203791182345, 'samples': 612480, 'steps': 3189, 'loss/train': 2.5135273933410645} +11/06/2021 21:42:49 - INFO - __main__ - Step 3191: {'lr': 0.0004999202451398853, 'samples': 612672, 'steps': 3190, 'loss/train': 2.0862905979156494} +11/06/2021 21:42:50 - INFO - __main__ - Step 3192: {'lr': 0.000499920111048926, 'samples': 612864, 'steps': 3191, 'loss/train': 2.3521876335144043} +11/06/2021 21:42:50 - INFO - __main__ - Step 3193: {'lr': 0.0004999199768453565, 'samples': 613056, 'steps': 3192, 'loss/train': 5.900242328643799} +11/06/2021 21:42:50 - INFO - __main__ - Step 3194: {'lr': 0.0004999198425291769, 'samples': 613248, 'steps': 3193, 'loss/train': 2.1287336349487305} +11/06/2021 21:42:52 - INFO - __main__ - Step 3195: {'lr': 0.0004999197081003873, 'samples': 613440, 'steps': 3194, 'loss/train': 1.8804785013198853} +11/06/2021 21:42:52 - INFO - __main__ - Step 3196: {'lr': 0.0004999195735589877, 'samples': 613632, 'steps': 3195, 'loss/train': 2.1079533100128174} +11/06/2021 21:42:52 - INFO - __main__ - Step 3197: {'lr': 0.0004999194389049783, 'samples': 613824, 'steps': 3196, 'loss/train': 2.4482831954956055} +11/06/2021 21:42:53 - INFO - __main__ - Step 3198: {'lr': 0.0004999193041383588, 'samples': 614016, 'steps': 3197, 'loss/train': 2.2492079734802246} +11/06/2021 21:42:53 - INFO - __main__ - Step 3199: {'lr': 0.0004999191692591299, 'samples': 614208, 'steps': 3198, 'loss/train': 1.8088970184326172} +11/06/2021 21:42:54 - INFO - __main__ - Step 3200: {'lr': 0.000499919034267291, 'samples': 614400, 'steps': 3199, 'loss/train': 2.175657272338867} +11/06/2021 21:42:54 - INFO - __main__ - Step 3201: {'lr': 0.0004999188991628425, 'samples': 614592, 'steps': 3200, 'loss/train': 2.242400646209717} +11/06/2021 21:42:55 - INFO - __main__ - Step 3202: {'lr': 0.0004999187639457844, 'samples': 614784, 'steps': 3201, 'loss/train': 2.0254077911376953} +11/06/2021 21:42:55 - INFO - __main__ - Step 3203: {'lr': 0.0004999186286161169, 'samples': 614976, 'steps': 3202, 'loss/train': 2.909585952758789} +11/06/2021 21:42:55 - INFO - __main__ - Step 3204: {'lr': 0.0004999184931738397, 'samples': 615168, 'steps': 3203, 'loss/train': 1.7180776596069336} +11/06/2021 21:42:56 - INFO - __main__ - Step 3205: {'lr': 0.0004999183576189532, 'samples': 615360, 'steps': 3204, 'loss/train': 2.3504021167755127} +11/06/2021 21:42:57 - INFO - __main__ - Step 3206: {'lr': 0.0004999182219514573, 'samples': 615552, 'steps': 3205, 'loss/train': 2.0548884868621826} +11/06/2021 21:42:57 - INFO - __main__ - Step 3207: {'lr': 0.0004999180861713522, 'samples': 615744, 'steps': 3206, 'loss/train': 2.1941933631896973} +11/06/2021 21:42:58 - INFO - __main__ - Step 3208: {'lr': 0.0004999179502786377, 'samples': 615936, 'steps': 3207, 'loss/train': 6.997474193572998} +11/06/2021 21:42:58 - INFO - __main__ - Step 3209: {'lr': 0.0004999178142733141, 'samples': 616128, 'steps': 3208, 'loss/train': 2.0363223552703857} +11/06/2021 21:42:59 - INFO - __main__ - Step 3210: {'lr': 0.0004999176781553815, 'samples': 616320, 'steps': 3209, 'loss/train': 2.108640432357788} +11/06/2021 21:42:59 - INFO - __main__ - Step 3211: {'lr': 0.0004999175419248398, 'samples': 616512, 'steps': 3210, 'loss/train': 2.0920512676239014} +11/06/2021 21:43:00 - INFO - __main__ - Step 3212: {'lr': 0.0004999174055816891, 'samples': 616704, 'steps': 3211, 'loss/train': 2.339956760406494} +11/06/2021 21:43:00 - INFO - __main__ - Step 3213: {'lr': 0.0004999172691259293, 'samples': 616896, 'steps': 3212, 'loss/train': 1.8541127443313599} +11/06/2021 21:43:01 - INFO - __main__ - Step 3214: {'lr': 0.0004999171325575609, 'samples': 617088, 'steps': 3213, 'loss/train': 1.9735697507858276} +11/06/2021 21:43:01 - INFO - __main__ - Step 3215: {'lr': 0.0004999169958765836, 'samples': 617280, 'steps': 3214, 'loss/train': 2.325428009033203} +11/06/2021 21:43:02 - INFO - __main__ - Step 3216: {'lr': 0.0004999168590829975, 'samples': 617472, 'steps': 3215, 'loss/train': 2.0824670791625977} +11/06/2021 21:43:02 - INFO - __main__ - Step 3217: {'lr': 0.0004999167221768028, 'samples': 617664, 'steps': 3216, 'loss/train': 2.0834946632385254} +11/06/2021 21:43:03 - INFO - __main__ - Step 3218: {'lr': 0.0004999165851579994, 'samples': 617856, 'steps': 3217, 'loss/train': 1.993496060371399} +11/06/2021 21:43:03 - INFO - __main__ - Step 3219: {'lr': 0.0004999164480265875, 'samples': 618048, 'steps': 3218, 'loss/train': 2.200866460800171} +11/06/2021 21:43:03 - INFO - __main__ - Step 3220: {'lr': 0.0004999163107825671, 'samples': 618240, 'steps': 3219, 'loss/train': 2.439110040664673} +11/06/2021 21:43:04 - INFO - __main__ - Step 3221: {'lr': 0.0004999161734259383, 'samples': 618432, 'steps': 3220, 'loss/train': 1.0018621683120728} +11/06/2021 21:43:05 - INFO - __main__ - Step 3222: {'lr': 0.0004999160359567011, 'samples': 618624, 'steps': 3221, 'loss/train': 1.9945106506347656} +11/06/2021 21:43:05 - INFO - __main__ - Step 3223: {'lr': 0.0004999158983748555, 'samples': 618816, 'steps': 3222, 'loss/train': 2.565582036972046} +11/06/2021 21:43:06 - INFO - __main__ - Step 3224: {'lr': 0.0004999157606804018, 'samples': 619008, 'steps': 3223, 'loss/train': 2.3982090950012207} +11/06/2021 21:43:06 - INFO - __main__ - Step 3225: {'lr': 0.0004999156228733398, 'samples': 619200, 'steps': 3224, 'loss/train': 2.0050203800201416} +11/06/2021 21:43:07 - INFO - __main__ - Step 3226: {'lr': 0.0004999154849536698, 'samples': 619392, 'steps': 3225, 'loss/train': 2.3978424072265625} +11/06/2021 21:43:07 - INFO - __main__ - Step 3227: {'lr': 0.0004999153469213917, 'samples': 619584, 'steps': 3226, 'loss/train': 1.5546318292617798} +11/06/2021 21:43:08 - INFO - __main__ - Step 3228: {'lr': 0.0004999152087765055, 'samples': 619776, 'steps': 3227, 'loss/train': 1.9464197158813477} +11/06/2021 21:43:08 - INFO - __main__ - Step 3229: {'lr': 0.0004999150705190114, 'samples': 619968, 'steps': 3228, 'loss/train': 2.4329493045806885} +11/06/2021 21:43:08 - INFO - __main__ - Step 3230: {'lr': 0.0004999149321489095, 'samples': 620160, 'steps': 3229, 'loss/train': 3.806713581085205} +11/06/2021 21:43:09 - INFO - __main__ - Step 3231: {'lr': 0.0004999147936661997, 'samples': 620352, 'steps': 3230, 'loss/train': 1.9667352437973022} +11/06/2021 21:43:10 - INFO - __main__ - Step 3232: {'lr': 0.0004999146550708822, 'samples': 620544, 'steps': 3231, 'loss/train': 2.300558567047119} +11/06/2021 21:43:10 - INFO - __main__ - Step 3233: {'lr': 0.000499914516362957, 'samples': 620736, 'steps': 3232, 'loss/train': 1.624573826789856} +11/06/2021 21:43:10 - INFO - __main__ - Step 3234: {'lr': 0.0004999143775424241, 'samples': 620928, 'steps': 3233, 'loss/train': 2.1690218448638916} +11/06/2021 21:43:11 - INFO - __main__ - Step 3235: {'lr': 0.0004999142386092838, 'samples': 621120, 'steps': 3234, 'loss/train': 1.306965708732605} +11/06/2021 21:43:12 - INFO - __main__ - Step 3236: {'lr': 0.000499914099563536, 'samples': 621312, 'steps': 3235, 'loss/train': 2.066814422607422} +11/06/2021 21:43:12 - INFO - __main__ - Step 3237: {'lr': 0.0004999139604051806, 'samples': 621504, 'steps': 3236, 'loss/train': 2.289586305618286} +11/06/2021 21:43:12 - INFO - __main__ - Step 3238: {'lr': 0.0004999138211342179, 'samples': 621696, 'steps': 3237, 'loss/train': 2.0394601821899414} +11/06/2021 21:43:13 - INFO - __main__ - Step 3239: {'lr': 0.0004999136817506478, 'samples': 621888, 'steps': 3238, 'loss/train': 2.375570297241211} +11/06/2021 21:43:13 - INFO - __main__ - Step 3240: {'lr': 0.0004999135422544707, 'samples': 622080, 'steps': 3239, 'loss/train': 1.8367230892181396} +11/06/2021 21:43:14 - INFO - __main__ - Step 3241: {'lr': 0.0004999134026456862, 'samples': 622272, 'steps': 3240, 'loss/train': 2.2936620712280273} +11/06/2021 21:43:14 - INFO - __main__ - Step 3242: {'lr': 0.0004999132629242946, 'samples': 622464, 'steps': 3241, 'loss/train': 2.675550937652588} +11/06/2021 21:43:15 - INFO - __main__ - Step 3243: {'lr': 0.000499913123090296, 'samples': 622656, 'steps': 3242, 'loss/train': 2.318620204925537} +11/06/2021 21:43:15 - INFO - __main__ - Step 3244: {'lr': 0.0004999129831436904, 'samples': 622848, 'steps': 3243, 'loss/train': 2.7929880619049072} +11/06/2021 21:43:15 - INFO - __main__ - Step 3245: {'lr': 0.0004999128430844778, 'samples': 623040, 'steps': 3244, 'loss/train': 1.8520056009292603} +11/06/2021 21:43:16 - INFO - __main__ - Step 3246: {'lr': 0.0004999127029126585, 'samples': 623232, 'steps': 3245, 'loss/train': 1.9427516460418701} +11/06/2021 21:43:17 - INFO - __main__ - Step 3247: {'lr': 0.0004999125626282322, 'samples': 623424, 'steps': 3246, 'loss/train': 2.054605484008789} +11/06/2021 21:43:17 - INFO - __main__ - Step 3248: {'lr': 0.0004999124222311993, 'samples': 623616, 'steps': 3247, 'loss/train': 1.6573278903961182} +11/06/2021 21:43:17 - INFO - __main__ - Step 3249: {'lr': 0.0004999122817215595, 'samples': 623808, 'steps': 3248, 'loss/train': 1.8662605285644531} +11/06/2021 21:43:18 - INFO - __main__ - Step 3250: {'lr': 0.0004999121410993133, 'samples': 624000, 'steps': 3249, 'loss/train': 2.0213828086853027} +11/06/2021 21:43:19 - INFO - __main__ - Step 3251: {'lr': 0.0004999120003644604, 'samples': 624192, 'steps': 3250, 'loss/train': 2.3014163970947266} +11/06/2021 21:43:19 - INFO - __main__ - Step 3252: {'lr': 0.0004999118595170011, 'samples': 624384, 'steps': 3251, 'loss/train': 2.2614598274230957} +11/06/2021 21:43:20 - INFO - __main__ - Step 3253: {'lr': 0.0004999117185569354, 'samples': 624576, 'steps': 3252, 'loss/train': 2.0688071250915527} +11/06/2021 21:43:20 - INFO - __main__ - Step 3254: {'lr': 0.0004999115774842633, 'samples': 624768, 'steps': 3253, 'loss/train': 1.5158661603927612} +11/06/2021 21:43:20 - INFO - __main__ - Step 3255: {'lr': 0.0004999114362989849, 'samples': 624960, 'steps': 3254, 'loss/train': 2.2318007946014404} +11/06/2021 21:43:21 - INFO - __main__ - Step 3256: {'lr': 0.0004999112950011002, 'samples': 625152, 'steps': 3255, 'loss/train': 1.8678102493286133} +11/06/2021 21:43:22 - INFO - __main__ - Step 3257: {'lr': 0.0004999111535906094, 'samples': 625344, 'steps': 3256, 'loss/train': 2.0674848556518555} +11/06/2021 21:43:22 - INFO - __main__ - Step 3258: {'lr': 0.0004999110120675125, 'samples': 625536, 'steps': 3257, 'loss/train': 1.557898998260498} +11/06/2021 21:43:23 - INFO - __main__ - Step 3259: {'lr': 0.0004999108704318095, 'samples': 625728, 'steps': 3258, 'loss/train': 1.9527461528778076} +11/06/2021 21:43:23 - INFO - __main__ - Step 3260: {'lr': 0.0004999107286835006, 'samples': 625920, 'steps': 3259, 'loss/train': 0.5624179244041443} +11/06/2021 21:43:23 - INFO - __main__ - Step 3261: {'lr': 0.0004999105868225858, 'samples': 626112, 'steps': 3260, 'loss/train': 2.3505382537841797} +11/06/2021 21:43:24 - INFO - __main__ - Step 3262: {'lr': 0.0004999104448490649, 'samples': 626304, 'steps': 3261, 'loss/train': 1.716923475265503} +11/06/2021 21:43:25 - INFO - __main__ - Step 3263: {'lr': 0.0004999103027629384, 'samples': 626496, 'steps': 3262, 'loss/train': 2.0216355323791504} +11/06/2021 21:43:25 - INFO - __main__ - Step 3264: {'lr': 0.0004999101605642061, 'samples': 626688, 'steps': 3263, 'loss/train': 2.3034634590148926} +11/06/2021 21:43:25 - INFO - __main__ - Step 3265: {'lr': 0.0004999100182528683, 'samples': 626880, 'steps': 3264, 'loss/train': 2.1556177139282227} +11/06/2021 21:43:26 - INFO - __main__ - Step 3266: {'lr': 0.0004999098758289248, 'samples': 627072, 'steps': 3265, 'loss/train': 2.250798463821411} +11/06/2021 21:43:27 - INFO - __main__ - Step 3267: {'lr': 0.0004999097332923758, 'samples': 627264, 'steps': 3266, 'loss/train': 2.280691623687744} +11/06/2021 21:43:27 - INFO - __main__ - Step 3268: {'lr': 0.0004999095906432213, 'samples': 627456, 'steps': 3267, 'loss/train': 2.3557052612304688} +11/06/2021 21:43:28 - INFO - __main__ - Step 3269: {'lr': 0.0004999094478814613, 'samples': 627648, 'steps': 3268, 'loss/train': 2.4633193016052246} +11/06/2021 21:43:28 - INFO - __main__ - Step 3270: {'lr': 0.0004999093050070961, 'samples': 627840, 'steps': 3269, 'loss/train': 5.240302562713623} +11/06/2021 21:43:28 - INFO - __main__ - Step 3271: {'lr': 0.0004999091620201255, 'samples': 628032, 'steps': 3270, 'loss/train': 4.105412006378174} +11/06/2021 21:43:29 - INFO - __main__ - Step 3272: {'lr': 0.0004999090189205498, 'samples': 628224, 'steps': 3271, 'loss/train': 2.502105951309204} +11/06/2021 21:43:29 - INFO - __main__ - Step 3273: {'lr': 0.0004999088757083689, 'samples': 628416, 'steps': 3272, 'loss/train': 2.263211250305176} +11/06/2021 21:43:30 - INFO - __main__ - Step 3274: {'lr': 0.0004999087323835829, 'samples': 628608, 'steps': 3273, 'loss/train': 1.1719061136245728} +11/06/2021 21:43:31 - INFO - __main__ - Step 3275: {'lr': 0.0004999085889461919, 'samples': 628800, 'steps': 3274, 'loss/train': 2.298391103744507} +11/06/2021 21:43:31 - INFO - __main__ - Step 3276: {'lr': 0.0004999084453961959, 'samples': 628992, 'steps': 3275, 'loss/train': 1.848705530166626} +11/06/2021 21:43:31 - INFO - __main__ - Step 3277: {'lr': 0.0004999083017335951, 'samples': 629184, 'steps': 3276, 'loss/train': 2.3697509765625} +11/06/2021 21:43:32 - INFO - __main__ - Step 3278: {'lr': 0.0004999081579583895, 'samples': 629376, 'steps': 3277, 'loss/train': 1.937208652496338} +11/06/2021 21:43:33 - INFO - __main__ - Step 3279: {'lr': 0.0004999080140705791, 'samples': 629568, 'steps': 3278, 'loss/train': 2.3870885372161865} +11/06/2021 21:43:33 - INFO - __main__ - Step 3280: {'lr': 0.0004999078700701639, 'samples': 629760, 'steps': 3279, 'loss/train': 2.4358227252960205} +11/06/2021 21:43:33 - INFO - __main__ - Step 3281: {'lr': 0.0004999077259571442, 'samples': 629952, 'steps': 3280, 'loss/train': 2.139662504196167} +11/06/2021 21:43:34 - INFO - __main__ - Step 3282: {'lr': 0.0004999075817315199, 'samples': 630144, 'steps': 3281, 'loss/train': 2.3960695266723633} +11/06/2021 21:43:34 - INFO - __main__ - Step 3283: {'lr': 0.0004999074373932911, 'samples': 630336, 'steps': 3282, 'loss/train': 1.9690511226654053} +11/06/2021 21:43:35 - INFO - __main__ - Step 3284: {'lr': 0.0004999072929424579, 'samples': 630528, 'steps': 3283, 'loss/train': 1.8000233173370361} +11/06/2021 21:43:35 - INFO - __main__ - Step 3285: {'lr': 0.0004999071483790203, 'samples': 630720, 'steps': 3284, 'loss/train': 2.917104721069336} +11/06/2021 21:43:36 - INFO - __main__ - Step 3286: {'lr': 0.0004999070037029783, 'samples': 630912, 'steps': 3285, 'loss/train': 2.3763699531555176} +11/06/2021 21:43:36 - INFO - __main__ - Step 3287: {'lr': 0.0004999068589143322, 'samples': 631104, 'steps': 3286, 'loss/train': 2.728950023651123} +11/06/2021 21:43:36 - INFO - __main__ - Step 3288: {'lr': 0.0004999067140130819, 'samples': 631296, 'steps': 3287, 'loss/train': 2.0896875858306885} +11/06/2021 21:43:37 - INFO - __main__ - Step 3289: {'lr': 0.0004999065689992273, 'samples': 631488, 'steps': 3288, 'loss/train': 2.303443431854248} +11/06/2021 21:43:38 - INFO - __main__ - Step 3290: {'lr': 0.0004999064238727689, 'samples': 631680, 'steps': 3289, 'loss/train': 2.483797073364258} +11/06/2021 21:43:38 - INFO - __main__ - Step 3291: {'lr': 0.0004999062786337064, 'samples': 631872, 'steps': 3290, 'loss/train': 1.8650814294815063} +11/06/2021 21:43:39 - INFO - __main__ - Step 3292: {'lr': 0.0004999061332820401, 'samples': 632064, 'steps': 3291, 'loss/train': 1.7333624362945557} +11/06/2021 21:43:39 - INFO - __main__ - Step 3293: {'lr': 0.0004999059878177699, 'samples': 632256, 'steps': 3292, 'loss/train': 2.357539176940918} +11/06/2021 21:43:40 - INFO - __main__ - Step 3294: {'lr': 0.0004999058422408959, 'samples': 632448, 'steps': 3293, 'loss/train': 2.1987416744232178} +11/06/2021 21:43:40 - INFO - __main__ - Step 3295: {'lr': 0.0004999056965514181, 'samples': 632640, 'steps': 3294, 'loss/train': 1.9118432998657227} +11/06/2021 21:43:41 - INFO - __main__ - Step 3296: {'lr': 0.0004999055507493368, 'samples': 632832, 'steps': 3295, 'loss/train': 2.26961612701416} +11/06/2021 21:43:41 - INFO - __main__ - Step 3297: {'lr': 0.0004999054048346517, 'samples': 633024, 'steps': 3296, 'loss/train': 2.7712512016296387} +11/06/2021 21:43:41 - INFO - __main__ - Step 3298: {'lr': 0.0004999052588073633, 'samples': 633216, 'steps': 3297, 'loss/train': 2.1366281509399414} +11/06/2021 21:43:42 - INFO - __main__ - Step 3299: {'lr': 0.0004999051126674714, 'samples': 633408, 'steps': 3298, 'loss/train': 1.3426307439804077} +11/06/2021 21:43:43 - INFO - __main__ - Step 3300: {'lr': 0.0004999049664149761, 'samples': 633600, 'steps': 3299, 'loss/train': 3.066981315612793} +11/06/2021 21:43:43 - INFO - __main__ - Step 3301: {'lr': 0.0004999048200498774, 'samples': 633792, 'steps': 3300, 'loss/train': 2.1740355491638184} +11/06/2021 21:43:43 - INFO - __main__ - Step 3302: {'lr': 0.0004999046735721755, 'samples': 633984, 'steps': 3301, 'loss/train': 2.4104175567626953} +11/06/2021 21:43:44 - INFO - __main__ - Step 3303: {'lr': 0.0004999045269818704, 'samples': 634176, 'steps': 3302, 'loss/train': 2.4756033420562744} +11/06/2021 21:43:45 - INFO - __main__ - Step 3304: {'lr': 0.0004999043802789622, 'samples': 634368, 'steps': 3303, 'loss/train': 1.4023329019546509} +11/06/2021 21:43:45 - INFO - __main__ - Step 3305: {'lr': 0.000499904233463451, 'samples': 634560, 'steps': 3304, 'loss/train': 1.6189985275268555} +11/06/2021 21:43:45 - INFO - __main__ - Step 3306: {'lr': 0.0004999040865353367, 'samples': 634752, 'steps': 3305, 'loss/train': 1.5078233480453491} +11/06/2021 21:43:46 - INFO - __main__ - Step 3307: {'lr': 0.0004999039394946196, 'samples': 634944, 'steps': 3306, 'loss/train': 1.8554377555847168} +11/06/2021 21:43:46 - INFO - __main__ - Step 3308: {'lr': 0.0004999037923412995, 'samples': 635136, 'steps': 3307, 'loss/train': 2.242231845855713} +11/06/2021 21:43:47 - INFO - __main__ - Step 3309: {'lr': 0.0004999036450753767, 'samples': 635328, 'steps': 3308, 'loss/train': 2.1639621257781982} +11/06/2021 21:43:47 - INFO - __main__ - Step 3310: {'lr': 0.0004999034976968511, 'samples': 635520, 'steps': 3309, 'loss/train': 2.1223878860473633} +11/06/2021 21:43:48 - INFO - __main__ - Step 3311: {'lr': 0.0004999033502057228, 'samples': 635712, 'steps': 3310, 'loss/train': 2.3255131244659424} +11/06/2021 21:43:48 - INFO - __main__ - Step 3312: {'lr': 0.000499903202601992, 'samples': 635904, 'steps': 3311, 'loss/train': 2.050856113433838} +11/06/2021 21:43:48 - INFO - __main__ - Step 3313: {'lr': 0.0004999030548856586, 'samples': 636096, 'steps': 3312, 'loss/train': 1.3736777305603027} +11/06/2021 21:43:49 - INFO - __main__ - Step 3314: {'lr': 0.0004999029070567229, 'samples': 636288, 'steps': 3313, 'loss/train': 2.3344199657440186} +11/06/2021 21:43:50 - INFO - __main__ - Step 3315: {'lr': 0.0004999027591151847, 'samples': 636480, 'steps': 3314, 'loss/train': 2.361743927001953} +11/06/2021 21:43:50 - INFO - __main__ - Step 3316: {'lr': 0.0004999026110610442, 'samples': 636672, 'steps': 3315, 'loss/train': 1.3730331659317017} +11/06/2021 21:43:51 - INFO - __main__ - Step 3317: {'lr': 0.0004999024628943014, 'samples': 636864, 'steps': 3316, 'loss/train': 2.4670941829681396} +11/06/2021 21:43:51 - INFO - __main__ - Step 3318: {'lr': 0.0004999023146149565, 'samples': 637056, 'steps': 3317, 'loss/train': 1.93985116481781} +11/06/2021 21:43:51 - INFO - __main__ - Step 3319: {'lr': 0.0004999021662230093, 'samples': 637248, 'steps': 3318, 'loss/train': 1.4250794649124146} +11/06/2021 21:43:52 - INFO - __main__ - Step 3320: {'lr': 0.0004999020177184601, 'samples': 637440, 'steps': 3319, 'loss/train': 2.3671536445617676} +11/06/2021 21:43:53 - INFO - __main__ - Step 3321: {'lr': 0.000499901869101309, 'samples': 637632, 'steps': 3320, 'loss/train': 2.1804182529449463} +11/06/2021 21:43:53 - INFO - __main__ - Step 3322: {'lr': 0.0004999017203715559, 'samples': 637824, 'steps': 3321, 'loss/train': 2.0329232215881348} +11/06/2021 21:43:53 - INFO - __main__ - Step 3323: {'lr': 0.000499901571529201, 'samples': 638016, 'steps': 3322, 'loss/train': 1.9539903402328491} +11/06/2021 21:43:54 - INFO - __main__ - Step 3324: {'lr': 0.0004999014225742442, 'samples': 638208, 'steps': 3323, 'loss/train': 1.762226939201355} +11/06/2021 21:43:55 - INFO - __main__ - Step 3325: {'lr': 0.0004999012735066858, 'samples': 638400, 'steps': 3324, 'loss/train': 2.084671974182129} +11/06/2021 21:43:55 - INFO - __main__ - Step 3326: {'lr': 0.0004999011243265257, 'samples': 638592, 'steps': 3325, 'loss/train': 2.541097402572632} +11/06/2021 21:43:55 - INFO - __main__ - Step 3327: {'lr': 0.000499900975033764, 'samples': 638784, 'steps': 3326, 'loss/train': 2.444103240966797} +11/06/2021 21:43:56 - INFO - __main__ - Step 3328: {'lr': 0.0004999008256284008, 'samples': 638976, 'steps': 3327, 'loss/train': 2.3885836601257324} +11/06/2021 21:43:56 - INFO - __main__ - Step 3329: {'lr': 0.0004999006761104361, 'samples': 639168, 'steps': 3328, 'loss/train': 1.9459644556045532} +11/06/2021 21:43:57 - INFO - __main__ - Step 3330: {'lr': 0.0004999005264798701, 'samples': 639360, 'steps': 3329, 'loss/train': 2.031470775604248} +11/06/2021 21:43:58 - INFO - __main__ - Step 3331: {'lr': 0.0004999003767367027, 'samples': 639552, 'steps': 3330, 'loss/train': 2.199577808380127} +11/06/2021 21:43:58 - INFO - __main__ - Step 3332: {'lr': 0.0004999002268809339, 'samples': 639744, 'steps': 3331, 'loss/train': 2.1211884021759033} +11/06/2021 21:43:59 - INFO - __main__ - Step 3333: {'lr': 0.0004999000769125642, 'samples': 639936, 'steps': 3332, 'loss/train': 3.076802968978882} +11/06/2021 21:43:59 - INFO - __main__ - Step 3334: {'lr': 0.0004998999268315932, 'samples': 640128, 'steps': 3333, 'loss/train': 2.300365447998047} +11/06/2021 21:43:59 - INFO - __main__ - Step 3335: {'lr': 0.0004998997766380212, 'samples': 640320, 'steps': 3334, 'loss/train': 2.047560214996338} +11/06/2021 21:44:00 - INFO - __main__ - Step 3336: {'lr': 0.0004998996263318482, 'samples': 640512, 'steps': 3335, 'loss/train': 2.0564115047454834} +11/06/2021 21:44:00 - INFO - __main__ - Step 3337: {'lr': 0.0004998994759130743, 'samples': 640704, 'steps': 3336, 'loss/train': 1.807005763053894} +11/06/2021 21:44:01 - INFO - __main__ - Step 3338: {'lr': 0.0004998993253816996, 'samples': 640896, 'steps': 3337, 'loss/train': 2.106369733810425} +11/06/2021 21:44:01 - INFO - __main__ - Step 3339: {'lr': 0.000499899174737724, 'samples': 641088, 'steps': 3338, 'loss/train': 2.363450765609741} +11/06/2021 21:44:02 - INFO - __main__ - Step 3340: {'lr': 0.0004998990239811477, 'samples': 641280, 'steps': 3339, 'loss/train': 1.9341990947723389} +11/06/2021 21:44:03 - INFO - __main__ - Step 3341: {'lr': 0.0004998988731119709, 'samples': 641472, 'steps': 3340, 'loss/train': 2.0908918380737305} +11/06/2021 21:44:03 - INFO - __main__ - Step 3342: {'lr': 0.0004998987221301935, 'samples': 641664, 'steps': 3341, 'loss/train': 2.078077793121338} +11/06/2021 21:44:03 - INFO - __main__ - Step 3343: {'lr': 0.0004998985710358155, 'samples': 641856, 'steps': 3342, 'loss/train': 1.9851315021514893} +11/06/2021 21:44:04 - INFO - __main__ - Step 3344: {'lr': 0.0004998984198288371, 'samples': 642048, 'steps': 3343, 'loss/train': 2.1168434619903564} +11/06/2021 21:44:04 - INFO - __main__ - Step 3345: {'lr': 0.0004998982685092583, 'samples': 642240, 'steps': 3344, 'loss/train': 2.281632900238037} +11/06/2021 21:44:05 - INFO - __main__ - Step 3346: {'lr': 0.0004998981170770792, 'samples': 642432, 'steps': 3345, 'loss/train': 2.356718063354492} +11/06/2021 21:44:05 - INFO - __main__ - Step 3347: {'lr': 0.0004998979655323, 'samples': 642624, 'steps': 3346, 'loss/train': 1.8560844659805298} +11/06/2021 21:44:06 - INFO - __main__ - Step 3348: {'lr': 0.0004998978138749204, 'samples': 642816, 'steps': 3347, 'loss/train': 1.9993972778320312} +11/06/2021 21:44:06 - INFO - __main__ - Step 3349: {'lr': 0.0004998976621049408, 'samples': 643008, 'steps': 3348, 'loss/train': 2.5754454135894775} +11/06/2021 21:44:06 - INFO - __main__ - Step 3350: {'lr': 0.0004998975102223612, 'samples': 643200, 'steps': 3349, 'loss/train': 2.1721551418304443} +11/06/2021 21:44:08 - INFO - __main__ - Step 3351: {'lr': 0.0004998973582271817, 'samples': 643392, 'steps': 3350, 'loss/train': 1.9218946695327759} +11/06/2021 21:44:08 - INFO - __main__ - Step 3352: {'lr': 0.0004998972061194022, 'samples': 643584, 'steps': 3351, 'loss/train': 2.063539743423462} +11/06/2021 21:44:08 - INFO - __main__ - Step 3353: {'lr': 0.0004998970538990228, 'samples': 643776, 'steps': 3352, 'loss/train': 2.91345477104187} +11/06/2021 21:44:09 - INFO - __main__ - Step 3354: {'lr': 0.0004998969015660438, 'samples': 643968, 'steps': 3353, 'loss/train': 1.8647414445877075} +11/06/2021 21:44:09 - INFO - __main__ - Step 3355: {'lr': 0.0004998967491204651, 'samples': 644160, 'steps': 3354, 'loss/train': 2.418487787246704} +11/06/2021 21:44:09 - INFO - __main__ - Step 3356: {'lr': 0.0004998965965622867, 'samples': 644352, 'steps': 3355, 'loss/train': 1.3407362699508667} +11/06/2021 21:44:11 - INFO - __main__ - Step 3357: {'lr': 0.0004998964438915088, 'samples': 644544, 'steps': 3356, 'loss/train': 2.0935134887695312} +11/06/2021 21:44:11 - INFO - __main__ - Step 3358: {'lr': 0.0004998962911081314, 'samples': 644736, 'steps': 3357, 'loss/train': 2.340810775756836} +11/06/2021 21:44:11 - INFO - __main__ - Step 3359: {'lr': 0.0004998961382121546, 'samples': 644928, 'steps': 3358, 'loss/train': 2.3082637786865234} +11/06/2021 21:44:12 - INFO - __main__ - Step 3360: {'lr': 0.0004998959852035785, 'samples': 645120, 'steps': 3359, 'loss/train': 1.8081005811691284} +11/06/2021 21:44:12 - INFO - __main__ - Step 3361: {'lr': 0.0004998958320824031, 'samples': 645312, 'steps': 3360, 'loss/train': 2.52008318901062} +11/06/2021 21:44:13 - INFO - __main__ - Step 3362: {'lr': 0.0004998956788486284, 'samples': 645504, 'steps': 3361, 'loss/train': 2.574852228164673} +11/06/2021 21:44:13 - INFO - __main__ - Step 3363: {'lr': 0.0004998955255022547, 'samples': 645696, 'steps': 3362, 'loss/train': 2.9360525608062744} +11/06/2021 21:44:14 - INFO - __main__ - Step 3364: {'lr': 0.0004998953720432818, 'samples': 645888, 'steps': 3363, 'loss/train': 2.0350911617279053} +11/06/2021 21:44:14 - INFO - __main__ - Step 3365: {'lr': 0.00049989521847171, 'samples': 646080, 'steps': 3364, 'loss/train': 1.7591485977172852} +11/06/2021 21:44:14 - INFO - __main__ - Step 3366: {'lr': 0.0004998950647875392, 'samples': 646272, 'steps': 3365, 'loss/train': 1.764539122581482} +11/06/2021 21:44:15 - INFO - __main__ - Step 3367: {'lr': 0.0004998949109907697, 'samples': 646464, 'steps': 3366, 'loss/train': 2.29533052444458} +11/06/2021 21:44:16 - INFO - __main__ - Step 3368: {'lr': 0.0004998947570814012, 'samples': 646656, 'steps': 3367, 'loss/train': 2.4703001976013184} +11/06/2021 21:44:16 - INFO - __main__ - Step 3369: {'lr': 0.0004998946030594341, 'samples': 646848, 'steps': 3368, 'loss/train': 2.0543324947357178} +11/06/2021 21:44:16 - INFO - __main__ - Step 3370: {'lr': 0.0004998944489248683, 'samples': 647040, 'steps': 3369, 'loss/train': 2.8122878074645996} +11/06/2021 21:44:17 - INFO - __main__ - Step 3371: {'lr': 0.000499894294677704, 'samples': 647232, 'steps': 3370, 'loss/train': 2.024826765060425} +11/06/2021 21:44:18 - INFO - __main__ - Step 3372: {'lr': 0.000499894140317941, 'samples': 647424, 'steps': 3371, 'loss/train': 2.372493267059326} +11/06/2021 21:44:18 - INFO - __main__ - Step 3373: {'lr': 0.0004998939858455798, 'samples': 647616, 'steps': 3372, 'loss/train': 1.8553732633590698} +11/06/2021 21:44:19 - INFO - __main__ - Step 3374: {'lr': 0.0004998938312606201, 'samples': 647808, 'steps': 3373, 'loss/train': 6.488889694213867} +11/06/2021 21:44:19 - INFO - __main__ - Step 3375: {'lr': 0.000499893676563062, 'samples': 648000, 'steps': 3374, 'loss/train': 2.1932318210601807} +11/06/2021 21:44:19 - INFO - __main__ - Step 3376: {'lr': 0.0004998935217529058, 'samples': 648192, 'steps': 3375, 'loss/train': 2.0442917346954346} +11/06/2021 21:44:20 - INFO - __main__ - Step 3377: {'lr': 0.0004998933668301514, 'samples': 648384, 'steps': 3376, 'loss/train': 1.9358372688293457} +11/06/2021 21:44:21 - INFO - __main__ - Step 3378: {'lr': 0.0004998932117947989, 'samples': 648576, 'steps': 3377, 'loss/train': 1.9061901569366455} +11/06/2021 21:44:21 - INFO - __main__ - Step 3379: {'lr': 0.0004998930566468484, 'samples': 648768, 'steps': 3378, 'loss/train': 2.5020077228546143} +11/06/2021 21:44:21 - INFO - __main__ - Step 3380: {'lr': 0.0004998929013863, 'samples': 648960, 'steps': 3379, 'loss/train': 1.080916404724121} +11/06/2021 21:44:22 - INFO - __main__ - Step 3381: {'lr': 0.0004998927460131535, 'samples': 649152, 'steps': 3380, 'loss/train': 2.488973379135132} +11/06/2021 21:44:22 - INFO - __main__ - Step 3382: {'lr': 0.0004998925905274094, 'samples': 649344, 'steps': 3381, 'loss/train': 1.9152915477752686} +11/06/2021 21:44:23 - INFO - __main__ - Step 3383: {'lr': 0.0004998924349290674, 'samples': 649536, 'steps': 3382, 'loss/train': 0.7557737827301025} +11/06/2021 21:44:24 - INFO - __main__ - Step 3384: {'lr': 0.0004998922792181278, 'samples': 649728, 'steps': 3383, 'loss/train': 1.4994975328445435} +11/06/2021 21:44:24 - INFO - __main__ - Step 3385: {'lr': 0.0004998921233945907, 'samples': 649920, 'steps': 3384, 'loss/train': 1.6330103874206543} +11/06/2021 21:44:24 - INFO - __main__ - Step 3386: {'lr': 0.0004998919674584559, 'samples': 650112, 'steps': 3385, 'loss/train': 1.484663486480713} +11/06/2021 21:44:25 - INFO - __main__ - Step 3387: {'lr': 0.0004998918114097237, 'samples': 650304, 'steps': 3386, 'loss/train': 2.346414566040039} +11/06/2021 21:44:26 - INFO - __main__ - Step 3388: {'lr': 0.0004998916552483941, 'samples': 650496, 'steps': 3387, 'loss/train': 1.351393699645996} +11/06/2021 21:44:26 - INFO - __main__ - Step 3389: {'lr': 0.0004998914989744671, 'samples': 650688, 'steps': 3388, 'loss/train': 2.10522198677063} +11/06/2021 21:44:26 - INFO - __main__ - Step 3390: {'lr': 0.000499891342587943, 'samples': 650880, 'steps': 3389, 'loss/train': 1.9814081192016602} +11/06/2021 21:44:27 - INFO - __main__ - Step 3391: {'lr': 0.0004998911860888217, 'samples': 651072, 'steps': 3390, 'loss/train': 1.96201491355896} +11/06/2021 21:44:27 - INFO - __main__ - Step 3392: {'lr': 0.0004998910294771032, 'samples': 651264, 'steps': 3391, 'loss/train': 2.6143369674682617} +11/06/2021 21:44:28 - INFO - __main__ - Step 3393: {'lr': 0.0004998908727527877, 'samples': 651456, 'steps': 3392, 'loss/train': 2.523289442062378} +11/06/2021 21:44:28 - INFO - __main__ - Step 3394: {'lr': 0.0004998907159158752, 'samples': 651648, 'steps': 3393, 'loss/train': 1.4275950193405151} +11/06/2021 21:44:29 - INFO - __main__ - Step 3395: {'lr': 0.0004998905589663658, 'samples': 651840, 'steps': 3394, 'loss/train': 2.1565451622009277} +11/06/2021 21:44:29 - INFO - __main__ - Step 3396: {'lr': 0.0004998904019042596, 'samples': 652032, 'steps': 3395, 'loss/train': 2.2461233139038086} +11/06/2021 21:44:30 - INFO - __main__ - Step 3397: {'lr': 0.0004998902447295567, 'samples': 652224, 'steps': 3396, 'loss/train': 2.1691172122955322} +11/06/2021 21:44:31 - INFO - __main__ - Step 3398: {'lr': 0.000499890087442257, 'samples': 652416, 'steps': 3397, 'loss/train': 2.0089993476867676} +11/06/2021 21:44:31 - INFO - __main__ - Step 3399: {'lr': 0.0004998899300423607, 'samples': 652608, 'steps': 3398, 'loss/train': 2.1266562938690186} +11/06/2021 21:44:31 - INFO - __main__ - Step 3400: {'lr': 0.0004998897725298679, 'samples': 652800, 'steps': 3399, 'loss/train': 1.9188565015792847} +11/06/2021 21:44:32 - INFO - __main__ - Step 3401: {'lr': 0.0004998896149047786, 'samples': 652992, 'steps': 3400, 'loss/train': 2.4505343437194824} +11/06/2021 21:44:32 - INFO - __main__ - Step 3402: {'lr': 0.0004998894571670929, 'samples': 653184, 'steps': 3401, 'loss/train': 2.3925869464874268} +11/06/2021 21:44:32 - INFO - __main__ - Step 3403: {'lr': 0.0004998892993168109, 'samples': 653376, 'steps': 3402, 'loss/train': 2.170724391937256} +11/06/2021 21:44:33 - INFO - __main__ - Step 3404: {'lr': 0.0004998891413539326, 'samples': 653568, 'steps': 3403, 'loss/train': 1.9499857425689697} +11/06/2021 21:44:34 - INFO - __main__ - Step 3405: {'lr': 0.0004998889832784581, 'samples': 653760, 'steps': 3404, 'loss/train': 2.608039379119873} +11/06/2021 21:44:34 - INFO - __main__ - Step 3406: {'lr': 0.0004998888250903875, 'samples': 653952, 'steps': 3405, 'loss/train': 2.1653521060943604} +11/06/2021 21:44:34 - INFO - __main__ - Step 3407: {'lr': 0.0004998886667897209, 'samples': 654144, 'steps': 3406, 'loss/train': 2.1557538509368896} +11/06/2021 21:44:35 - INFO - __main__ - Step 3408: {'lr': 0.0004998885083764582, 'samples': 654336, 'steps': 3407, 'loss/train': 2.54028582572937} +11/06/2021 21:44:36 - INFO - __main__ - Step 3409: {'lr': 0.0004998883498505996, 'samples': 654528, 'steps': 3408, 'loss/train': 2.0685014724731445} +11/06/2021 21:44:36 - INFO - __main__ - Step 3410: {'lr': 0.0004998881912121453, 'samples': 654720, 'steps': 3409, 'loss/train': 1.7899914979934692} +11/06/2021 21:44:37 - INFO - __main__ - Step 3411: {'lr': 0.0004998880324610952, 'samples': 654912, 'steps': 3410, 'loss/train': 2.2215492725372314} +11/06/2021 21:44:37 - INFO - __main__ - Step 3412: {'lr': 0.0004998878735974493, 'samples': 655104, 'steps': 3411, 'loss/train': 2.2348644733428955} +11/06/2021 21:44:37 - INFO - __main__ - Step 3413: {'lr': 0.0004998877146212079, 'samples': 655296, 'steps': 3412, 'loss/train': 2.385568618774414} +11/06/2021 21:44:38 - INFO - __main__ - Step 3414: {'lr': 0.0004998875555323708, 'samples': 655488, 'steps': 3413, 'loss/train': 2.1982250213623047} +11/06/2021 21:44:38 - INFO - __main__ - Step 3415: {'lr': 0.0004998873963309384, 'samples': 655680, 'steps': 3414, 'loss/train': 2.085184097290039} +11/06/2021 21:44:39 - INFO - __main__ - Step 3416: {'lr': 0.0004998872370169105, 'samples': 655872, 'steps': 3415, 'loss/train': 2.228264808654785} +11/06/2021 21:44:39 - INFO - __main__ - Step 3417: {'lr': 0.0004998870775902872, 'samples': 656064, 'steps': 3416, 'loss/train': 2.356597900390625} +11/06/2021 21:44:40 - INFO - __main__ - Step 3418: {'lr': 0.0004998869180510688, 'samples': 656256, 'steps': 3417, 'loss/train': 1.9543739557266235} +11/06/2021 21:44:41 - INFO - __main__ - Step 3419: {'lr': 0.0004998867583992551, 'samples': 656448, 'steps': 3418, 'loss/train': 1.8418172597885132} +11/06/2021 21:44:41 - INFO - __main__ - Step 3420: {'lr': 0.0004998865986348464, 'samples': 656640, 'steps': 3419, 'loss/train': 1.725966453552246} +11/06/2021 21:44:42 - INFO - __main__ - Step 3421: {'lr': 0.0004998864387578426, 'samples': 656832, 'steps': 3420, 'loss/train': 1.9191683530807495} +11/06/2021 21:44:42 - INFO - __main__ - Step 3422: {'lr': 0.0004998862787682438, 'samples': 657024, 'steps': 3421, 'loss/train': 2.177302598953247} +11/06/2021 21:44:42 - INFO - __main__ - Step 3423: {'lr': 0.00049988611866605, 'samples': 657216, 'steps': 3422, 'loss/train': 1.9818519353866577} +11/06/2021 21:44:43 - INFO - __main__ - Step 3424: {'lr': 0.0004998859584512615, 'samples': 657408, 'steps': 3423, 'loss/train': 2.42037296295166} +11/06/2021 21:44:44 - INFO - __main__ - Step 3425: {'lr': 0.0004998857981238782, 'samples': 657600, 'steps': 3424, 'loss/train': 0.6604869961738586} +11/06/2021 21:44:44 - INFO - __main__ - Step 3426: {'lr': 0.0004998856376839003, 'samples': 657792, 'steps': 3425, 'loss/train': 0.3991982340812683} +11/06/2021 21:44:45 - INFO - __main__ - Step 3427: {'lr': 0.0004998854771313277, 'samples': 657984, 'steps': 3426, 'loss/train': 2.094467878341675} +11/06/2021 21:44:45 - INFO - __main__ - Step 3428: {'lr': 0.0004998853164661606, 'samples': 658176, 'steps': 3427, 'loss/train': 1.7819459438323975} +11/06/2021 21:44:45 - INFO - __main__ - Step 3429: {'lr': 0.000499885155688399, 'samples': 658368, 'steps': 3428, 'loss/train': 2.345151901245117} +11/06/2021 21:44:46 - INFO - __main__ - Step 3430: {'lr': 0.000499884994798043, 'samples': 658560, 'steps': 3429, 'loss/train': 1.721934199333191} +11/06/2021 21:44:47 - INFO - __main__ - Step 3431: {'lr': 0.0004998848337950927, 'samples': 658752, 'steps': 3430, 'loss/train': 1.6747421026229858} +11/06/2021 21:44:47 - INFO - __main__ - Step 3432: {'lr': 0.0004998846726795482, 'samples': 658944, 'steps': 3431, 'loss/train': 2.4393625259399414} +11/06/2021 21:44:47 - INFO - __main__ - Step 3433: {'lr': 0.0004998845114514095, 'samples': 659136, 'steps': 3432, 'loss/train': 1.8727471828460693} +11/06/2021 21:44:48 - INFO - __main__ - Step 3434: {'lr': 0.0004998843501106766, 'samples': 659328, 'steps': 3433, 'loss/train': 2.1409528255462646} +11/06/2021 21:44:49 - INFO - __main__ - Step 3435: {'lr': 0.0004998841886573496, 'samples': 659520, 'steps': 3434, 'loss/train': 2.510873317718506} +11/06/2021 21:44:49 - INFO - __main__ - Step 3436: {'lr': 0.0004998840270914288, 'samples': 659712, 'steps': 3435, 'loss/train': 1.8569953441619873} +11/06/2021 21:44:50 - INFO - __main__ - Step 3437: {'lr': 0.0004998838654129142, 'samples': 659904, 'steps': 3436, 'loss/train': 1.0409950017929077} +11/06/2021 21:44:50 - INFO - __main__ - Step 3438: {'lr': 0.0004998837036218056, 'samples': 660096, 'steps': 3437, 'loss/train': 2.066178798675537} +11/06/2021 21:44:51 - INFO - __main__ - Step 3439: {'lr': 0.0004998835417181033, 'samples': 660288, 'steps': 3438, 'loss/train': 1.7412632703781128} +11/06/2021 21:44:52 - INFO - __main__ - Step 3440: {'lr': 0.0004998833797018074, 'samples': 660480, 'steps': 3439, 'loss/train': 1.823896050453186} +11/06/2021 21:44:52 - INFO - __main__ - Step 3441: {'lr': 0.0004998832175729179, 'samples': 660672, 'steps': 3440, 'loss/train': 2.1356678009033203} +11/06/2021 21:44:52 - INFO - __main__ - Step 3442: {'lr': 0.0004998830553314349, 'samples': 660864, 'steps': 3441, 'loss/train': 1.7477060556411743} +11/06/2021 21:44:53 - INFO - __main__ - Step 3443: {'lr': 0.0004998828929773583, 'samples': 661056, 'steps': 3442, 'loss/train': 2.1472830772399902} +11/06/2021 21:44:53 - INFO - __main__ - Step 3444: {'lr': 0.0004998827305106884, 'samples': 661248, 'steps': 3443, 'loss/train': 1.7395120859146118} +11/06/2021 21:44:54 - INFO - __main__ - Step 3445: {'lr': 0.0004998825679314253, 'samples': 661440, 'steps': 3444, 'loss/train': 2.5220179557800293} +11/06/2021 21:44:54 - INFO - __main__ - Step 3446: {'lr': 0.0004998824052395689, 'samples': 661632, 'steps': 3445, 'loss/train': 2.2687270641326904} +11/06/2021 21:44:55 - INFO - __main__ - Step 3447: {'lr': 0.0004998822424351193, 'samples': 661824, 'steps': 3446, 'loss/train': 2.2349984645843506} +11/06/2021 21:44:55 - INFO - __main__ - Step 3448: {'lr': 0.0004998820795180766, 'samples': 662016, 'steps': 3447, 'loss/train': 2.5539913177490234} +11/06/2021 21:44:55 - INFO - __main__ - Step 3449: {'lr': 0.000499881916488441, 'samples': 662208, 'steps': 3448, 'loss/train': 1.9206302165985107} +11/06/2021 21:44:57 - INFO - __main__ - Step 3450: {'lr': 0.0004998817533462123, 'samples': 662400, 'steps': 3449, 'loss/train': 2.2440977096557617} +11/06/2021 21:44:57 - INFO - __main__ - Step 3451: {'lr': 0.0004998815900913909, 'samples': 662592, 'steps': 3450, 'loss/train': 1.2015467882156372} +11/06/2021 21:44:57 - INFO - __main__ - Step 3452: {'lr': 0.0004998814267239767, 'samples': 662784, 'steps': 3451, 'loss/train': 2.6361520290374756} +11/06/2021 21:44:58 - INFO - __main__ - Step 3453: {'lr': 0.0004998812632439697, 'samples': 662976, 'steps': 3452, 'loss/train': 1.7184646129608154} +11/06/2021 21:44:58 - INFO - __main__ - Step 3454: {'lr': 0.00049988109965137, 'samples': 663168, 'steps': 3453, 'loss/train': 2.2237768173217773} +11/06/2021 21:44:58 - INFO - __main__ - Step 3455: {'lr': 0.000499880935946178, 'samples': 663360, 'steps': 3454, 'loss/train': 1.60335111618042} +11/06/2021 21:44:59 - INFO - __main__ - Step 3456: {'lr': 0.0004998807721283932, 'samples': 663552, 'steps': 3455, 'loss/train': 4.451015472412109} +11/06/2021 21:45:00 - INFO - __main__ - Step 3457: {'lr': 0.0004998806081980162, 'samples': 663744, 'steps': 3456, 'loss/train': 2.589240074157715} +11/06/2021 21:45:00 - INFO - __main__ - Step 3458: {'lr': 0.0004998804441550467, 'samples': 663936, 'steps': 3457, 'loss/train': 1.5202341079711914} +11/06/2021 21:45:00 - INFO - __main__ - Step 3459: {'lr': 0.000499880279999485, 'samples': 664128, 'steps': 3458, 'loss/train': 2.2377476692199707} +11/06/2021 21:45:01 - INFO - __main__ - Step 3460: {'lr': 0.0004998801157313311, 'samples': 664320, 'steps': 3459, 'loss/train': 2.0967650413513184} +11/06/2021 21:45:02 - INFO - __main__ - Step 3461: {'lr': 0.0004998799513505851, 'samples': 664512, 'steps': 3460, 'loss/train': 2.196791648864746} +11/06/2021 21:45:02 - INFO - __main__ - Step 3462: {'lr': 0.000499879786857247, 'samples': 664704, 'steps': 3461, 'loss/train': 2.2895452976226807} +11/06/2021 21:45:02 - INFO - __main__ - Step 3463: {'lr': 0.0004998796222513169, 'samples': 664896, 'steps': 3462, 'loss/train': 2.4116644859313965} +11/06/2021 21:45:03 - INFO - __main__ - Step 3464: {'lr': 0.000499879457532795, 'samples': 665088, 'steps': 3463, 'loss/train': 2.3247618675231934} +11/06/2021 21:45:03 - INFO - __main__ - Step 3465: {'lr': 0.0004998792927016812, 'samples': 665280, 'steps': 3464, 'loss/train': 2.557910203933716} +11/06/2021 21:45:04 - INFO - __main__ - Step 3466: {'lr': 0.0004998791277579757, 'samples': 665472, 'steps': 3465, 'loss/train': 2.2992501258850098} +11/06/2021 21:45:04 - INFO - __main__ - Step 3467: {'lr': 0.0004998789627016784, 'samples': 665664, 'steps': 3466, 'loss/train': 2.114197254180908} +11/06/2021 21:45:05 - INFO - __main__ - Step 3468: {'lr': 0.0004998787975327896, 'samples': 665856, 'steps': 3467, 'loss/train': 2.2296416759490967} +11/06/2021 21:45:05 - INFO - __main__ - Step 3469: {'lr': 0.0004998786322513093, 'samples': 666048, 'steps': 3468, 'loss/train': 2.309483528137207} +11/06/2021 21:45:05 - INFO - __main__ - Step 3470: {'lr': 0.0004998784668572375, 'samples': 666240, 'steps': 3469, 'loss/train': 1.9443069696426392} +11/06/2021 21:45:06 - INFO - __main__ - Step 3471: {'lr': 0.0004998783013505743, 'samples': 666432, 'steps': 3470, 'loss/train': 2.0072755813598633} +11/06/2021 21:45:07 - INFO - __main__ - Step 3472: {'lr': 0.0004998781357313198, 'samples': 666624, 'steps': 3471, 'loss/train': 2.455528974533081} +11/06/2021 21:45:07 - INFO - __main__ - Step 3473: {'lr': 0.0004998779699994741, 'samples': 666816, 'steps': 3472, 'loss/train': 2.9603943824768066} +11/06/2021 21:45:07 - INFO - __main__ - Step 3474: {'lr': 0.0004998778041550372, 'samples': 667008, 'steps': 3473, 'loss/train': 2.1143574714660645} +11/06/2021 21:45:08 - INFO - __main__ - Step 3475: {'lr': 0.0004998776381980092, 'samples': 667200, 'steps': 3474, 'loss/train': 2.124244213104248} +11/06/2021 21:45:08 - INFO - __main__ - Step 3476: {'lr': 0.0004998774721283903, 'samples': 667392, 'steps': 3475, 'loss/train': 2.0879619121551514} +11/06/2021 21:45:09 - INFO - __main__ - Step 3477: {'lr': 0.0004998773059461803, 'samples': 667584, 'steps': 3476, 'loss/train': 2.3110809326171875} +11/06/2021 21:45:10 - INFO - __main__ - Step 3478: {'lr': 0.0004998771396513796, 'samples': 667776, 'steps': 3477, 'loss/train': 2.4501490592956543} +11/06/2021 21:45:10 - INFO - __main__ - Step 3479: {'lr': 0.000499876973243988, 'samples': 667968, 'steps': 3478, 'loss/train': 1.411661148071289} +11/06/2021 21:45:10 - INFO - __main__ - Step 3480: {'lr': 0.0004998768067240059, 'samples': 668160, 'steps': 3479, 'loss/train': 2.6114776134490967} +11/06/2021 21:45:11 - INFO - __main__ - Step 3481: {'lr': 0.0004998766400914329, 'samples': 668352, 'steps': 3480, 'loss/train': 2.1029934883117676} +11/06/2021 21:45:12 - INFO - __main__ - Step 3482: {'lr': 0.0004998764733462694, 'samples': 668544, 'steps': 3481, 'loss/train': 1.7680230140686035} +11/06/2021 21:45:12 - INFO - __main__ - Step 3483: {'lr': 0.0004998763064885155, 'samples': 668736, 'steps': 3482, 'loss/train': 2.153639554977417} +11/06/2021 21:45:12 - INFO - __main__ - Step 3484: {'lr': 0.0004998761395181712, 'samples': 668928, 'steps': 3483, 'loss/train': 2.03013014793396} +11/06/2021 21:45:13 - INFO - __main__ - Step 3485: {'lr': 0.0004998759724352365, 'samples': 669120, 'steps': 3484, 'loss/train': 0.6211015582084656} +11/06/2021 21:45:13 - INFO - __main__ - Step 3486: {'lr': 0.0004998758052397115, 'samples': 669312, 'steps': 3485, 'loss/train': 1.9367340803146362} +11/06/2021 21:45:14 - INFO - __main__ - Step 3487: {'lr': 0.0004998756379315964, 'samples': 669504, 'steps': 3486, 'loss/train': 1.8777623176574707} +11/06/2021 21:45:14 - INFO - __main__ - Step 3488: {'lr': 0.0004998754705108912, 'samples': 669696, 'steps': 3487, 'loss/train': 2.432539939880371} +11/06/2021 21:45:15 - INFO - __main__ - Step 3489: {'lr': 0.000499875302977596, 'samples': 669888, 'steps': 3488, 'loss/train': 2.30979585647583} +11/06/2021 21:45:15 - INFO - __main__ - Step 3490: {'lr': 0.0004998751353317108, 'samples': 670080, 'steps': 3489, 'loss/train': 2.282562017440796} +11/06/2021 21:45:15 - INFO - __main__ - Step 3491: {'lr': 0.0004998749675732357, 'samples': 670272, 'steps': 3490, 'loss/train': 2.008915662765503} +11/06/2021 21:45:17 - INFO - __main__ - Step 3492: {'lr': 0.0004998747997021708, 'samples': 670464, 'steps': 3491, 'loss/train': 2.295339584350586} +11/06/2021 21:45:17 - INFO - __main__ - Step 3493: {'lr': 0.0004998746317185162, 'samples': 670656, 'steps': 3492, 'loss/train': 2.1820249557495117} +11/06/2021 21:45:18 - INFO - __main__ - Step 3494: {'lr': 0.000499874463622272, 'samples': 670848, 'steps': 3493, 'loss/train': 2.051396131515503} +11/06/2021 21:45:18 - INFO - __main__ - Step 3495: {'lr': 0.000499874295413438, 'samples': 671040, 'steps': 3494, 'loss/train': 1.9268534183502197} +11/06/2021 21:45:18 - INFO - __main__ - Step 3496: {'lr': 0.0004998741270920147, 'samples': 671232, 'steps': 3495, 'loss/train': 2.2112491130828857} +11/06/2021 21:45:19 - INFO - __main__ - Step 3497: {'lr': 0.0004998739586580019, 'samples': 671424, 'steps': 3496, 'loss/train': 2.0771069526672363} +11/06/2021 21:45:19 - INFO - __main__ - Step 3498: {'lr': 0.0004998737901113999, 'samples': 671616, 'steps': 3497, 'loss/train': 5.947204113006592} +11/06/2021 21:45:20 - INFO - __main__ - Step 3499: {'lr': 0.0004998736214522084, 'samples': 671808, 'steps': 3498, 'loss/train': 3.6572864055633545} +11/06/2021 21:45:20 - INFO - __main__ - Step 3500: {'lr': 0.0004998734526804278, 'samples': 672000, 'steps': 3499, 'loss/train': 2.2772557735443115} +11/06/2021 21:45:21 - INFO - __main__ - Step 3501: {'lr': 0.0004998732837960581, 'samples': 672192, 'steps': 3500, 'loss/train': 1.6389656066894531} +11/06/2021 21:45:21 - INFO - __main__ - Step 3502: {'lr': 0.0004998731147990993, 'samples': 672384, 'steps': 3501, 'loss/train': 2.0018649101257324} +11/06/2021 21:45:21 - INFO - __main__ - Step 3503: {'lr': 0.0004998729456895516, 'samples': 672576, 'steps': 3502, 'loss/train': 2.645084857940674} +11/06/2021 21:45:23 - INFO - __main__ - Step 3504: {'lr': 0.0004998727764674149, 'samples': 672768, 'steps': 3503, 'loss/train': 2.0491695404052734} +11/06/2021 21:45:23 - INFO - __main__ - Step 3505: {'lr': 0.0004998726071326896, 'samples': 672960, 'steps': 3504, 'loss/train': 1.6065165996551514} +11/06/2021 21:45:23 - INFO - __main__ - Step 3506: {'lr': 0.0004998724376853754, 'samples': 673152, 'steps': 3505, 'loss/train': 1.9586995840072632} +11/06/2021 21:45:24 - INFO - __main__ - Step 3507: {'lr': 0.0004998722681254725, 'samples': 673344, 'steps': 3506, 'loss/train': 1.835058569908142} +11/06/2021 21:45:24 - INFO - __main__ - Step 3508: {'lr': 0.0004998720984529811, 'samples': 673536, 'steps': 3507, 'loss/train': 2.592658519744873} +11/06/2021 21:45:25 - INFO - __main__ - Step 3509: {'lr': 0.0004998719286679011, 'samples': 673728, 'steps': 3508, 'loss/train': 1.8576128482818604} +11/06/2021 21:45:25 - INFO - __main__ - Step 3510: {'lr': 0.0004998717587702328, 'samples': 673920, 'steps': 3509, 'loss/train': 1.9809731245040894} +11/06/2021 21:45:26 - INFO - __main__ - Step 3511: {'lr': 0.0004998715887599759, 'samples': 674112, 'steps': 3510, 'loss/train': 1.734330415725708} +11/06/2021 21:45:26 - INFO - __main__ - Step 3512: {'lr': 0.000499871418637131, 'samples': 674304, 'steps': 3511, 'loss/train': 1.7968868017196655} +11/06/2021 21:45:26 - INFO - __main__ - Step 3513: {'lr': 0.0004998712484016977, 'samples': 674496, 'steps': 3512, 'loss/train': 2.3915631771087646} +11/06/2021 21:45:27 - INFO - __main__ - Step 3514: {'lr': 0.0004998710780536763, 'samples': 674688, 'steps': 3513, 'loss/train': 2.1563174724578857} +11/06/2021 21:45:28 - INFO - __main__ - Step 3515: {'lr': 0.0004998709075930669, 'samples': 674880, 'steps': 3514, 'loss/train': 1.6511495113372803} +11/06/2021 21:45:28 - INFO - __main__ - Step 3516: {'lr': 0.0004998707370198695, 'samples': 675072, 'steps': 3515, 'loss/train': 2.0000085830688477} +11/06/2021 21:45:28 - INFO - __main__ - Step 3517: {'lr': 0.0004998705663340843, 'samples': 675264, 'steps': 3516, 'loss/train': 1.445250153541565} +11/06/2021 21:45:29 - INFO - __main__ - Step 3518: {'lr': 0.0004998703955357111, 'samples': 675456, 'steps': 3517, 'loss/train': 1.4034719467163086} +11/06/2021 21:45:30 - INFO - __main__ - Step 3519: {'lr': 0.0004998702246247502, 'samples': 675648, 'steps': 3518, 'loss/train': 2.529625415802002} +11/06/2021 21:45:30 - INFO - __main__ - Step 3520: {'lr': 0.0004998700536012017, 'samples': 675840, 'steps': 3519, 'loss/train': 2.3188982009887695} +11/06/2021 21:45:30 - INFO - __main__ - Step 3521: {'lr': 0.0004998698824650655, 'samples': 676032, 'steps': 3520, 'loss/train': 0.6927474737167358} +11/06/2021 21:45:31 - INFO - __main__ - Step 3522: {'lr': 0.000499869711216342, 'samples': 676224, 'steps': 3521, 'loss/train': 1.4308483600616455} +11/06/2021 21:45:31 - INFO - __main__ - Step 3523: {'lr': 0.0004998695398550309, 'samples': 676416, 'steps': 3522, 'loss/train': 2.8342642784118652} +11/06/2021 21:45:32 - INFO - __main__ - Step 3524: {'lr': 0.0004998693683811325, 'samples': 676608, 'steps': 3523, 'loss/train': 2.05680513381958} +11/06/2021 21:45:32 - INFO - __main__ - Step 3525: {'lr': 0.0004998691967946468, 'samples': 676800, 'steps': 3524, 'loss/train': 2.1919660568237305} +11/06/2021 21:45:33 - INFO - __main__ - Step 3526: {'lr': 0.000499869025095574, 'samples': 676992, 'steps': 3525, 'loss/train': 1.6675937175750732} +11/06/2021 21:45:33 - INFO - __main__ - Step 3527: {'lr': 0.0004998688532839139, 'samples': 677184, 'steps': 3526, 'loss/train': 2.5993382930755615} +11/06/2021 21:45:34 - INFO - __main__ - Step 3528: {'lr': 0.0004998686813596668, 'samples': 677376, 'steps': 3527, 'loss/train': 2.326568126678467} +11/06/2021 21:45:34 - INFO - __main__ - Step 3529: {'lr': 0.0004998685093228327, 'samples': 677568, 'steps': 3528, 'loss/train': 1.6023788452148438} +11/06/2021 21:45:35 - INFO - __main__ - Step 3530: {'lr': 0.0004998683371734118, 'samples': 677760, 'steps': 3529, 'loss/train': 1.248134732246399} +11/06/2021 21:45:35 - INFO - __main__ - Step 3531: {'lr': 0.000499868164911404, 'samples': 677952, 'steps': 3530, 'loss/train': 1.8184454441070557} +11/06/2021 21:45:36 - INFO - __main__ - Step 3532: {'lr': 0.0004998679925368094, 'samples': 678144, 'steps': 3531, 'loss/train': 1.9451133012771606} +11/06/2021 21:45:36 - INFO - __main__ - Step 3533: {'lr': 0.0004998678200496283, 'samples': 678336, 'steps': 3532, 'loss/train': 2.026451587677002} +11/06/2021 21:45:36 - INFO - __main__ - Step 3534: {'lr': 0.0004998676474498606, 'samples': 678528, 'steps': 3533, 'loss/train': 1.7797132730484009} +11/06/2021 21:45:37 - INFO - __main__ - Step 3535: {'lr': 0.0004998674747375063, 'samples': 678720, 'steps': 3534, 'loss/train': 2.1139495372772217} +11/06/2021 21:45:38 - INFO - __main__ - Step 3536: {'lr': 0.0004998673019125657, 'samples': 678912, 'steps': 3535, 'loss/train': 2.0227255821228027} +11/06/2021 21:45:38 - INFO - __main__ - Step 3537: {'lr': 0.0004998671289750386, 'samples': 679104, 'steps': 3536, 'loss/train': 2.357372283935547} +11/06/2021 21:45:38 - INFO - __main__ - Step 3538: {'lr': 0.0004998669559249252, 'samples': 679296, 'steps': 3537, 'loss/train': 2.0382673740386963} +11/06/2021 21:45:39 - INFO - __main__ - Step 3539: {'lr': 0.0004998667827622258, 'samples': 679488, 'steps': 3538, 'loss/train': 1.8378405570983887} +11/06/2021 21:45:40 - INFO - __main__ - Step 3540: {'lr': 0.0004998666094869402, 'samples': 679680, 'steps': 3539, 'loss/train': 1.9578657150268555} +11/06/2021 21:45:40 - INFO - __main__ - Step 3541: {'lr': 0.0004998664360990685, 'samples': 679872, 'steps': 3540, 'loss/train': 2.1692068576812744} +11/06/2021 21:45:41 - INFO - __main__ - Step 3542: {'lr': 0.0004998662625986109, 'samples': 680064, 'steps': 3541, 'loss/train': 1.96601140499115} +11/06/2021 21:45:41 - INFO - __main__ - Step 3543: {'lr': 0.0004998660889855674, 'samples': 680256, 'steps': 3542, 'loss/train': 2.4479618072509766} +11/06/2021 21:45:41 - INFO - __main__ - Step 3544: {'lr': 0.0004998659152599381, 'samples': 680448, 'steps': 3543, 'loss/train': 2.9186902046203613} +11/06/2021 21:45:43 - INFO - __main__ - Step 3545: {'lr': 0.000499865741421723, 'samples': 680640, 'steps': 3544, 'loss/train': 1.9552292823791504} +11/06/2021 21:45:43 - INFO - __main__ - Step 3546: {'lr': 0.0004998655674709224, 'samples': 680832, 'steps': 3545, 'loss/train': 2.1400067806243896} +11/06/2021 21:45:43 - INFO - __main__ - Step 3547: {'lr': 0.0004998653934075361, 'samples': 681024, 'steps': 3546, 'loss/train': 2.2904787063598633} +11/06/2021 21:45:44 - INFO - __main__ - Step 3548: {'lr': 0.0004998652192315644, 'samples': 681216, 'steps': 3547, 'loss/train': 1.8039276599884033} +11/06/2021 21:45:44 - INFO - __main__ - Step 3549: {'lr': 0.0004998650449430073, 'samples': 681408, 'steps': 3548, 'loss/train': 1.7798856496810913} +11/06/2021 21:45:45 - INFO - __main__ - Step 3550: {'lr': 0.0004998648705418648, 'samples': 681600, 'steps': 3549, 'loss/train': 1.5824065208435059} +11/06/2021 21:45:45 - INFO - __main__ - Step 3551: {'lr': 0.000499864696028137, 'samples': 681792, 'steps': 3550, 'loss/train': 1.8516236543655396} +11/06/2021 21:45:46 - INFO - __main__ - Step 3552: {'lr': 0.000499864521401824, 'samples': 681984, 'steps': 3551, 'loss/train': 2.100595474243164} +11/06/2021 21:45:46 - INFO - __main__ - Step 3553: {'lr': 0.000499864346662926, 'samples': 682176, 'steps': 3552, 'loss/train': 2.4325428009033203} +11/06/2021 21:45:46 - INFO - __main__ - Step 3554: {'lr': 0.000499864171811443, 'samples': 682368, 'steps': 3553, 'loss/train': 1.2289140224456787} +11/06/2021 21:45:47 - INFO - __main__ - Step 3555: {'lr': 0.0004998639968473751, 'samples': 682560, 'steps': 3554, 'loss/train': 2.2943685054779053} +11/06/2021 21:45:48 - INFO - __main__ - Step 3556: {'lr': 0.0004998638217707222, 'samples': 682752, 'steps': 3555, 'loss/train': 2.264774799346924} +11/06/2021 21:45:48 - INFO - __main__ - Step 3557: {'lr': 0.0004998636465814846, 'samples': 682944, 'steps': 3556, 'loss/train': 1.637046217918396} +11/06/2021 21:45:48 - INFO - __main__ - Step 3558: {'lr': 0.0004998634712796622, 'samples': 683136, 'steps': 3557, 'loss/train': 2.0852251052856445} +11/06/2021 21:45:49 - INFO - __main__ - Step 3559: {'lr': 0.0004998632958652554, 'samples': 683328, 'steps': 3558, 'loss/train': 1.820117473602295} +11/06/2021 21:45:50 - INFO - __main__ - Step 3560: {'lr': 0.0004998631203382639, 'samples': 683520, 'steps': 3559, 'loss/train': 2.074711561203003} +11/06/2021 21:45:50 - INFO - __main__ - Step 3561: {'lr': 0.0004998629446986879, 'samples': 683712, 'steps': 3560, 'loss/train': 2.1228792667388916} +11/06/2021 21:45:51 - INFO - __main__ - Step 3562: {'lr': 0.0004998627689465276, 'samples': 683904, 'steps': 3561, 'loss/train': 2.0950121879577637} +11/06/2021 21:45:51 - INFO - __main__ - Step 3563: {'lr': 0.0004998625930817829, 'samples': 684096, 'steps': 3562, 'loss/train': 2.041194200515747} +11/06/2021 21:45:51 - INFO - __main__ - Step 3564: {'lr': 0.0004998624171044541, 'samples': 684288, 'steps': 3563, 'loss/train': 1.9695250988006592} +11/06/2021 21:45:52 - INFO - __main__ - Step 3565: {'lr': 0.000499862241014541, 'samples': 684480, 'steps': 3564, 'loss/train': 2.691624164581299} +11/06/2021 21:45:53 - INFO - __main__ - Step 3566: {'lr': 0.0004998620648120439, 'samples': 684672, 'steps': 3565, 'loss/train': 1.932613730430603} +11/06/2021 21:45:53 - INFO - __main__ - Step 3567: {'lr': 0.0004998618884969628, 'samples': 684864, 'steps': 3566, 'loss/train': 2.155407190322876} +11/06/2021 21:45:53 - INFO - __main__ - Step 3568: {'lr': 0.0004998617120692977, 'samples': 685056, 'steps': 3567, 'loss/train': 1.8647109270095825} +11/06/2021 21:45:54 - INFO - __main__ - Step 3569: {'lr': 0.0004998615355290489, 'samples': 685248, 'steps': 3568, 'loss/train': 0.48862022161483765} +11/06/2021 21:45:55 - INFO - __main__ - Step 3570: {'lr': 0.0004998613588762163, 'samples': 685440, 'steps': 3569, 'loss/train': 2.087411642074585} +11/06/2021 21:45:55 - INFO - __main__ - Step 3571: {'lr': 0.0004998611821108001, 'samples': 685632, 'steps': 3570, 'loss/train': 2.365281820297241} +11/06/2021 21:45:55 - INFO - __main__ - Step 3572: {'lr': 0.0004998610052328002, 'samples': 685824, 'steps': 3571, 'loss/train': 1.9633747339248657} +11/06/2021 21:45:56 - INFO - __main__ - Step 3573: {'lr': 0.0004998608282422169, 'samples': 686016, 'steps': 3572, 'loss/train': 2.195950746536255} +11/06/2021 21:45:56 - INFO - __main__ - Step 3574: {'lr': 0.0004998606511390501, 'samples': 686208, 'steps': 3573, 'loss/train': 1.7376683950424194} +11/06/2021 21:45:56 - INFO - __main__ - Step 3575: {'lr': 0.0004998604739232999, 'samples': 686400, 'steps': 3574, 'loss/train': 2.2785563468933105} +11/06/2021 21:45:58 - INFO - __main__ - Step 3576: {'lr': 0.0004998602965949664, 'samples': 686592, 'steps': 3575, 'loss/train': 1.848177433013916} +11/06/2021 21:45:58 - INFO - __main__ - Step 3577: {'lr': 0.0004998601191540499, 'samples': 686784, 'steps': 3576, 'loss/train': 2.7372477054595947} +11/06/2021 21:45:58 - INFO - __main__ - Step 3578: {'lr': 0.0004998599416005502, 'samples': 686976, 'steps': 3577, 'loss/train': 2.2560975551605225} +11/06/2021 21:45:59 - INFO - __main__ - Step 3579: {'lr': 0.0004998597639344674, 'samples': 687168, 'steps': 3578, 'loss/train': 2.355379819869995} +11/06/2021 21:45:59 - INFO - __main__ - Step 3580: {'lr': 0.0004998595861558016, 'samples': 687360, 'steps': 3579, 'loss/train': 2.119218111038208} +11/06/2021 21:46:00 - INFO - __main__ - Step 3581: {'lr': 0.000499859408264553, 'samples': 687552, 'steps': 3580, 'loss/train': 1.7983760833740234} +11/06/2021 21:46:00 - INFO - __main__ - Step 3582: {'lr': 0.0004998592302607217, 'samples': 687744, 'steps': 3581, 'loss/train': 2.229571580886841} +11/06/2021 21:46:01 - INFO - __main__ - Step 3583: {'lr': 0.0004998590521443075, 'samples': 687936, 'steps': 3582, 'loss/train': 1.9575389623641968} +11/06/2021 21:46:01 - INFO - __main__ - Step 3584: {'lr': 0.0004998588739153108, 'samples': 688128, 'steps': 3583, 'loss/train': 1.7447315454483032} +11/06/2021 21:46:01 - INFO - __main__ - Step 3585: {'lr': 0.0004998586955737316, 'samples': 688320, 'steps': 3584, 'loss/train': 2.1006550788879395} +11/06/2021 21:46:02 - INFO - __main__ - Step 3586: {'lr': 0.0004998585171195698, 'samples': 688512, 'steps': 3585, 'loss/train': 3.3587646484375} +11/06/2021 21:46:03 - INFO - __main__ - Step 3587: {'lr': 0.0004998583385528256, 'samples': 688704, 'steps': 3586, 'loss/train': 2.2408502101898193} +11/06/2021 21:46:03 - INFO - __main__ - Step 3588: {'lr': 0.0004998581598734991, 'samples': 688896, 'steps': 3587, 'loss/train': 1.8953609466552734} +11/06/2021 21:46:04 - INFO - __main__ - Step 3589: {'lr': 0.0004998579810815905, 'samples': 689088, 'steps': 3588, 'loss/train': 2.701934576034546} +11/06/2021 21:46:04 - INFO - __main__ - Step 3590: {'lr': 0.0004998578021770995, 'samples': 689280, 'steps': 3589, 'loss/train': 1.9593024253845215} +11/06/2021 21:46:05 - INFO - __main__ - Step 3591: {'lr': 0.0004998576231600267, 'samples': 689472, 'steps': 3590, 'loss/train': 1.8404669761657715} +11/06/2021 21:46:05 - INFO - __main__ - Step 3592: {'lr': 0.0004998574440303718, 'samples': 689664, 'steps': 3591, 'loss/train': 2.3145079612731934} +11/06/2021 21:46:06 - INFO - __main__ - Step 3593: {'lr': 0.0004998572647881349, 'samples': 689856, 'steps': 3592, 'loss/train': 1.889504075050354} +11/06/2021 21:46:06 - INFO - __main__ - Step 3594: {'lr': 0.0004998570854333163, 'samples': 690048, 'steps': 3593, 'loss/train': 1.687559962272644} +11/06/2021 21:46:06 - INFO - __main__ - Step 3595: {'lr': 0.0004998569059659158, 'samples': 690240, 'steps': 3594, 'loss/train': 1.928205966949463} +11/06/2021 21:46:07 - INFO - __main__ - Step 3596: {'lr': 0.0004998567263859338, 'samples': 690432, 'steps': 3595, 'loss/train': 2.1471500396728516} +11/06/2021 21:46:08 - INFO - __main__ - Step 3597: {'lr': 0.0004998565466933702, 'samples': 690624, 'steps': 3596, 'loss/train': 2.6100289821624756} +11/06/2021 21:46:08 - INFO - __main__ - Step 3598: {'lr': 0.000499856366888225, 'samples': 690816, 'steps': 3597, 'loss/train': 1.6505409479141235} +11/06/2021 21:46:08 - INFO - __main__ - Step 3599: {'lr': 0.0004998561869704983, 'samples': 691008, 'steps': 3598, 'loss/train': 1.5047534704208374} +11/06/2021 21:46:09 - INFO - __main__ - Step 3600: {'lr': 0.0004998560069401905, 'samples': 691200, 'steps': 3599, 'loss/train': 2.1573095321655273} +11/06/2021 21:46:10 - INFO - __main__ - Step 3601: {'lr': 0.0004998558267973013, 'samples': 691392, 'steps': 3600, 'loss/train': 2.1335763931274414} +11/06/2021 21:46:10 - INFO - __main__ - Step 3602: {'lr': 0.0004998556465418309, 'samples': 691584, 'steps': 3601, 'loss/train': 2.135831832885742} +11/06/2021 21:46:11 - INFO - __main__ - Step 3603: {'lr': 0.0004998554661737795, 'samples': 691776, 'steps': 3602, 'loss/train': 2.5998644828796387} +11/06/2021 21:46:11 - INFO - __main__ - Step 3604: {'lr': 0.000499855285693147, 'samples': 691968, 'steps': 3603, 'loss/train': 2.1776552200317383} +11/06/2021 21:46:11 - INFO - __main__ - Step 3605: {'lr': 0.0004998551050999336, 'samples': 692160, 'steps': 3604, 'loss/train': 1.8231139183044434} +11/06/2021 21:46:12 - INFO - __main__ - Step 3606: {'lr': 0.0004998549243941393, 'samples': 692352, 'steps': 3605, 'loss/train': 1.756971001625061} +11/06/2021 21:46:13 - INFO - __main__ - Step 3607: {'lr': 0.0004998547435757643, 'samples': 692544, 'steps': 3606, 'loss/train': 1.6793618202209473} +11/06/2021 21:46:13 - INFO - __main__ - Step 3608: {'lr': 0.0004998545626448087, 'samples': 692736, 'steps': 3607, 'loss/train': 2.033261299133301} +11/06/2021 21:46:13 - INFO - __main__ - Step 3609: {'lr': 0.0004998543816012723, 'samples': 692928, 'steps': 3608, 'loss/train': 2.1296401023864746} +11/06/2021 21:46:14 - INFO - __main__ - Step 3610: {'lr': 0.0004998542004451554, 'samples': 693120, 'steps': 3609, 'loss/train': 2.213966131210327} +11/06/2021 21:46:14 - INFO - __main__ - Step 3611: {'lr': 0.000499854019176458, 'samples': 693312, 'steps': 3610, 'loss/train': 2.0920517444610596} +11/06/2021 21:46:15 - INFO - __main__ - Step 3612: {'lr': 0.0004998538377951803, 'samples': 693504, 'steps': 3611, 'loss/train': 0.8657620549201965} +11/06/2021 21:46:15 - INFO - __main__ - Step 3613: {'lr': 0.0004998536563013224, 'samples': 693696, 'steps': 3612, 'loss/train': 2.072887659072876} +11/06/2021 21:46:16 - INFO - __main__ - Step 3614: {'lr': 0.0004998534746948843, 'samples': 693888, 'steps': 3613, 'loss/train': 1.9264954328536987} +11/06/2021 21:46:16 - INFO - __main__ - Step 3615: {'lr': 0.000499853292975866, 'samples': 694080, 'steps': 3614, 'loss/train': 0.808038592338562} +11/06/2021 21:46:16 - INFO - __main__ - Step 3616: {'lr': 0.0004998531111442676, 'samples': 694272, 'steps': 3615, 'loss/train': 1.6517269611358643} +11/06/2021 21:46:18 - INFO - __main__ - Step 3617: {'lr': 0.0004998529292000893, 'samples': 694464, 'steps': 3616, 'loss/train': 2.1595749855041504} +11/06/2021 21:46:18 - INFO - __main__ - Step 3618: {'lr': 0.0004998527471433312, 'samples': 694656, 'steps': 3617, 'loss/train': 1.3440548181533813} +11/06/2021 21:46:18 - INFO - __main__ - Step 3619: {'lr': 0.0004998525649739932, 'samples': 694848, 'steps': 3618, 'loss/train': 1.8935426473617554} +11/06/2021 21:46:19 - INFO - __main__ - Step 3620: {'lr': 0.0004998523826920756, 'samples': 695040, 'steps': 3619, 'loss/train': 2.0238497257232666} +11/06/2021 21:46:19 - INFO - __main__ - Step 3621: {'lr': 0.0004998522002975783, 'samples': 695232, 'steps': 3620, 'loss/train': 2.4836816787719727} +11/06/2021 21:46:20 - INFO - __main__ - Step 3622: {'lr': 0.0004998520177905015, 'samples': 695424, 'steps': 3621, 'loss/train': 1.8629294633865356} +11/06/2021 21:46:20 - INFO - __main__ - Step 3623: {'lr': 0.0004998518351708452, 'samples': 695616, 'steps': 3622, 'loss/train': 2.230546712875366} +11/06/2021 21:46:21 - INFO - __main__ - Step 3624: {'lr': 0.0004998516524386095, 'samples': 695808, 'steps': 3623, 'loss/train': 2.3679111003875732} +11/06/2021 21:46:21 - INFO - __main__ - Step 3625: {'lr': 0.0004998514695937945, 'samples': 696000, 'steps': 3624, 'loss/train': 2.3775951862335205} +11/06/2021 21:46:21 - INFO - __main__ - Step 3626: {'lr': 0.0004998512866364003, 'samples': 696192, 'steps': 3625, 'loss/train': 1.8260321617126465} +11/06/2021 21:46:23 - INFO - __main__ - Step 3627: {'lr': 0.000499851103566427, 'samples': 696384, 'steps': 3626, 'loss/train': 2.3718161582946777} +11/06/2021 21:46:24 - INFO - __main__ - Step 3628: {'lr': 0.0004998509203838746, 'samples': 696576, 'steps': 3627, 'loss/train': 2.2593507766723633} +11/06/2021 21:46:24 - INFO - __main__ - Step 3629: {'lr': 0.0004998507370887433, 'samples': 696768, 'steps': 3628, 'loss/train': 2.683199882507324} +11/06/2021 21:46:24 - INFO - __main__ - Step 3630: {'lr': 0.000499850553681033, 'samples': 696960, 'steps': 3629, 'loss/train': 3.9143762588500977} +11/06/2021 21:46:25 - INFO - __main__ - Step 3631: {'lr': 0.000499850370160744, 'samples': 697152, 'steps': 3630, 'loss/train': 5.931422233581543} +11/06/2021 21:46:25 - INFO - __main__ - Step 3632: {'lr': 0.0004998501865278762, 'samples': 697344, 'steps': 3631, 'loss/train': 1.1052885055541992} +11/06/2021 21:46:25 - INFO - __main__ - Step 3633: {'lr': 0.0004998500027824298, 'samples': 697536, 'steps': 3632, 'loss/train': 1.352131724357605} +11/06/2021 21:46:26 - INFO - __main__ - Step 3634: {'lr': 0.0004998498189244049, 'samples': 697728, 'steps': 3633, 'loss/train': 2.097627639770508} +11/06/2021 21:46:27 - INFO - __main__ - Step 3635: {'lr': 0.0004998496349538015, 'samples': 697920, 'steps': 3634, 'loss/train': 2.872110605239868} +11/06/2021 21:46:27 - INFO - __main__ - Step 3636: {'lr': 0.0004998494508706196, 'samples': 698112, 'steps': 3635, 'loss/train': 1.6961387395858765} +11/06/2021 21:46:27 - INFO - __main__ - Step 3637: {'lr': 0.0004998492666748594, 'samples': 698304, 'steps': 3636, 'loss/train': 2.1306369304656982} +11/06/2021 21:46:28 - INFO - __main__ - Step 3638: {'lr': 0.0004998490823665211, 'samples': 698496, 'steps': 3637, 'loss/train': 2.1220192909240723} +11/06/2021 21:46:29 - INFO - __main__ - Step 3639: {'lr': 0.0004998488979456046, 'samples': 698688, 'steps': 3638, 'loss/train': 2.4169700145721436} +11/06/2021 21:46:29 - INFO - __main__ - Step 3640: {'lr': 0.00049984871341211, 'samples': 698880, 'steps': 3639, 'loss/train': 2.1508548259735107} +11/06/2021 21:46:30 - INFO - __main__ - Step 3641: {'lr': 0.0004998485287660375, 'samples': 699072, 'steps': 3640, 'loss/train': 2.348625898361206} +11/06/2021 21:46:30 - INFO - __main__ - Step 3642: {'lr': 0.0004998483440073871, 'samples': 699264, 'steps': 3641, 'loss/train': 2.3207335472106934} +11/06/2021 21:46:30 - INFO - __main__ - Step 3643: {'lr': 0.0004998481591361589, 'samples': 699456, 'steps': 3642, 'loss/train': 2.584690570831299} +11/06/2021 21:46:31 - INFO - __main__ - Step 3644: {'lr': 0.000499847974152353, 'samples': 699648, 'steps': 3643, 'loss/train': 1.8976331949234009} +11/06/2021 21:46:32 - INFO - __main__ - Step 3645: {'lr': 0.0004998477890559693, 'samples': 699840, 'steps': 3644, 'loss/train': 1.7949036359786987} +11/06/2021 21:46:32 - INFO - __main__ - Step 3646: {'lr': 0.0004998476038470082, 'samples': 700032, 'steps': 3645, 'loss/train': 2.1402628421783447} +11/06/2021 21:46:32 - INFO - __main__ - Step 3647: {'lr': 0.0004998474185254696, 'samples': 700224, 'steps': 3646, 'loss/train': 2.140929937362671} +11/06/2021 21:46:33 - INFO - __main__ - Step 3648: {'lr': 0.0004998472330913535, 'samples': 700416, 'steps': 3647, 'loss/train': 1.1526223421096802} +11/06/2021 21:46:34 - INFO - __main__ - Step 3649: {'lr': 0.0004998470475446603, 'samples': 700608, 'steps': 3648, 'loss/train': 2.2785234451293945} +11/06/2021 21:46:34 - INFO - __main__ - Step 3650: {'lr': 0.0004998468618853896, 'samples': 700800, 'steps': 3649, 'loss/train': 2.1500542163848877} +11/06/2021 21:46:35 - INFO - __main__ - Step 3651: {'lr': 0.000499846676113542, 'samples': 700992, 'steps': 3650, 'loss/train': 2.041510820388794} +11/06/2021 21:46:35 - INFO - __main__ - Step 3652: {'lr': 0.0004998464902291173, 'samples': 701184, 'steps': 3651, 'loss/train': 2.313647985458374} +11/06/2021 21:46:35 - INFO - __main__ - Step 3653: {'lr': 0.0004998463042321155, 'samples': 701376, 'steps': 3652, 'loss/train': 1.6131926774978638} +11/06/2021 21:46:36 - INFO - __main__ - Step 3654: {'lr': 0.0004998461181225369, 'samples': 701568, 'steps': 3653, 'loss/train': 2.0128300189971924} +11/06/2021 21:46:37 - INFO - __main__ - Step 3655: {'lr': 0.0004998459319003815, 'samples': 701760, 'steps': 3654, 'loss/train': 2.388474464416504} +11/06/2021 21:46:37 - INFO - __main__ - Step 3656: {'lr': 0.0004998457455656493, 'samples': 701952, 'steps': 3655, 'loss/train': 1.8429226875305176} +11/06/2021 21:46:37 - INFO - __main__ - Step 3657: {'lr': 0.0004998455591183406, 'samples': 702144, 'steps': 3656, 'loss/train': 2.267188310623169} +11/06/2021 21:46:38 - INFO - __main__ - Step 3658: {'lr': 0.0004998453725584552, 'samples': 702336, 'steps': 3657, 'loss/train': 2.0592057704925537} +11/06/2021 21:46:39 - INFO - __main__ - Step 3659: {'lr': 0.0004998451858859934, 'samples': 702528, 'steps': 3658, 'loss/train': 1.9567612409591675} +11/06/2021 21:46:39 - INFO - __main__ - Step 3660: {'lr': 0.0004998449991009552, 'samples': 702720, 'steps': 3659, 'loss/train': 2.084226608276367} +11/06/2021 21:46:39 - INFO - __main__ - Step 3661: {'lr': 0.0004998448122033408, 'samples': 702912, 'steps': 3660, 'loss/train': 2.5636651515960693} +11/06/2021 21:46:40 - INFO - __main__ - Step 3662: {'lr': 0.00049984462519315, 'samples': 703104, 'steps': 3661, 'loss/train': 2.506985664367676} +11/06/2021 21:46:40 - INFO - __main__ - Step 3663: {'lr': 0.0004998444380703832, 'samples': 703296, 'steps': 3662, 'loss/train': 2.208871603012085} +11/06/2021 21:46:41 - INFO - __main__ - Step 3664: {'lr': 0.0004998442508350404, 'samples': 703488, 'steps': 3663, 'loss/train': 2.199995994567871} +11/06/2021 21:46:41 - INFO - __main__ - Step 3665: {'lr': 0.0004998440634871215, 'samples': 703680, 'steps': 3664, 'loss/train': 1.8999465703964233} +11/06/2021 21:46:42 - INFO - __main__ - Step 3666: {'lr': 0.0004998438760266267, 'samples': 703872, 'steps': 3665, 'loss/train': 2.107455253601074} +11/06/2021 21:46:42 - INFO - __main__ - Step 3667: {'lr': 0.0004998436884535562, 'samples': 704064, 'steps': 3666, 'loss/train': 1.854463815689087} +11/06/2021 21:46:42 - INFO - __main__ - Step 3668: {'lr': 0.00049984350076791, 'samples': 704256, 'steps': 3667, 'loss/train': 2.7667548656463623} +11/06/2021 21:46:44 - INFO - __main__ - Step 3669: {'lr': 0.0004998433129696882, 'samples': 704448, 'steps': 3668, 'loss/train': 1.5981824398040771} +11/06/2021 21:46:44 - INFO - __main__ - Step 3670: {'lr': 0.0004998431250588907, 'samples': 704640, 'steps': 3669, 'loss/train': 2.160209894180298} +11/06/2021 21:46:44 - INFO - __main__ - Step 3671: {'lr': 0.0004998429370355179, 'samples': 704832, 'steps': 3670, 'loss/train': 1.8680161237716675} +11/06/2021 21:46:45 - INFO - __main__ - Step 3672: {'lr': 0.0004998427488995697, 'samples': 705024, 'steps': 3671, 'loss/train': 2.518526315689087} +11/06/2021 21:46:45 - INFO - __main__ - Step 3673: {'lr': 0.0004998425606510461, 'samples': 705216, 'steps': 3672, 'loss/train': 2.714362621307373} +11/06/2021 21:46:45 - INFO - __main__ - Step 3674: {'lr': 0.0004998423722899475, 'samples': 705408, 'steps': 3673, 'loss/train': 1.8246042728424072} +11/06/2021 21:46:46 - INFO - __main__ - Step 3675: {'lr': 0.0004998421838162735, 'samples': 705600, 'steps': 3674, 'loss/train': 0.9275121688842773} +11/06/2021 21:46:47 - INFO - __main__ - Step 3676: {'lr': 0.0004998419952300247, 'samples': 705792, 'steps': 3675, 'loss/train': 2.0111794471740723} +11/06/2021 21:46:47 - INFO - __main__ - Step 3677: {'lr': 0.0004998418065312009, 'samples': 705984, 'steps': 3676, 'loss/train': 1.89971923828125} +11/06/2021 21:46:47 - INFO - __main__ - Step 3678: {'lr': 0.0004998416177198022, 'samples': 706176, 'steps': 3677, 'loss/train': 1.930174708366394} +11/06/2021 21:46:48 - INFO - __main__ - Step 3679: {'lr': 0.0004998414287958288, 'samples': 706368, 'steps': 3678, 'loss/train': 2.1186258792877197} +11/06/2021 21:46:49 - INFO - __main__ - Step 3680: {'lr': 0.0004998412397592807, 'samples': 706560, 'steps': 3679, 'loss/train': 2.1540133953094482} +11/06/2021 21:46:49 - INFO - __main__ - Step 3681: {'lr': 0.0004998410506101579, 'samples': 706752, 'steps': 3680, 'loss/train': 1.5001546144485474} +11/06/2021 21:46:50 - INFO - __main__ - Step 3682: {'lr': 0.0004998408613484605, 'samples': 706944, 'steps': 3681, 'loss/train': 1.7224041223526} +11/06/2021 21:46:50 - INFO - __main__ - Step 3683: {'lr': 0.0004998406719741888, 'samples': 707136, 'steps': 3682, 'loss/train': 1.118072509765625} +11/06/2021 21:46:51 - INFO - __main__ - Step 3684: {'lr': 0.0004998404824873428, 'samples': 707328, 'steps': 3683, 'loss/train': 1.8773263692855835} +11/06/2021 21:46:51 - INFO - __main__ - Step 3685: {'lr': 0.0004998402928879225, 'samples': 707520, 'steps': 3684, 'loss/train': 1.9647787809371948} +11/06/2021 21:46:52 - INFO - __main__ - Step 3686: {'lr': 0.000499840103175928, 'samples': 707712, 'steps': 3685, 'loss/train': 2.2132978439331055} +11/06/2021 21:46:52 - INFO - __main__ - Step 3687: {'lr': 0.0004998399133513594, 'samples': 707904, 'steps': 3686, 'loss/train': 2.232158899307251} +11/06/2021 21:46:53 - INFO - __main__ - Step 3688: {'lr': 0.0004998397234142167, 'samples': 708096, 'steps': 3687, 'loss/train': 2.528634786605835} +11/06/2021 21:46:53 - INFO - __main__ - Step 3689: {'lr': 0.0004998395333645002, 'samples': 708288, 'steps': 3688, 'loss/train': 2.5124094486236572} +11/06/2021 21:46:54 - INFO - __main__ - Step 3690: {'lr': 0.0004998393432022098, 'samples': 708480, 'steps': 3689, 'loss/train': 2.4985034465789795} +11/06/2021 21:46:54 - INFO - __main__ - Step 3691: {'lr': 0.0004998391529273457, 'samples': 708672, 'steps': 3690, 'loss/train': 2.0140085220336914} +11/06/2021 21:46:55 - INFO - __main__ - Step 3692: {'lr': 0.0004998389625399079, 'samples': 708864, 'steps': 3691, 'loss/train': 1.7472585439682007} +11/06/2021 21:46:55 - INFO - __main__ - Step 3693: {'lr': 0.0004998387720398965, 'samples': 709056, 'steps': 3692, 'loss/train': 2.138169527053833} +11/06/2021 21:46:55 - INFO - __main__ - Step 3694: {'lr': 0.0004998385814273116, 'samples': 709248, 'steps': 3693, 'loss/train': 1.8398798704147339} +11/06/2021 21:46:56 - INFO - __main__ - Step 3695: {'lr': 0.0004998383907021533, 'samples': 709440, 'steps': 3694, 'loss/train': 2.2453384399414062} +11/06/2021 21:46:57 - INFO - __main__ - Step 3696: {'lr': 0.0004998381998644217, 'samples': 709632, 'steps': 3695, 'loss/train': 2.210822105407715} +11/06/2021 21:46:57 - INFO - __main__ - Step 3697: {'lr': 0.0004998380089141169, 'samples': 709824, 'steps': 3696, 'loss/train': 1.83198082447052} +11/06/2021 21:46:57 - INFO - __main__ - Step 3698: {'lr': 0.0004998378178512388, 'samples': 710016, 'steps': 3697, 'loss/train': 2.363736391067505} +11/06/2021 21:46:58 - INFO - __main__ - Step 3699: {'lr': 0.0004998376266757878, 'samples': 710208, 'steps': 3698, 'loss/train': 1.7178457975387573} +11/06/2021 21:46:58 - INFO - __main__ - Step 3700: {'lr': 0.0004998374353877638, 'samples': 710400, 'steps': 3699, 'loss/train': 1.9114118814468384} +11/06/2021 21:46:59 - INFO - __main__ - Step 3701: {'lr': 0.0004998372439871668, 'samples': 710592, 'steps': 3700, 'loss/train': 2.2929277420043945} +11/06/2021 21:46:59 - INFO - __main__ - Step 3702: {'lr': 0.000499837052473997, 'samples': 710784, 'steps': 3701, 'loss/train': 2.206447124481201} +11/06/2021 21:47:00 - INFO - __main__ - Step 3703: {'lr': 0.0004998368608482546, 'samples': 710976, 'steps': 3702, 'loss/train': 2.2719476222991943} +11/06/2021 21:47:00 - INFO - __main__ - Step 3704: {'lr': 0.0004998366691099395, 'samples': 711168, 'steps': 3703, 'loss/train': 1.9696950912475586} +11/06/2021 21:47:01 - INFO - __main__ - Step 3705: {'lr': 0.0004998364772590518, 'samples': 711360, 'steps': 3704, 'loss/train': 1.9279074668884277} +11/06/2021 21:47:02 - INFO - __main__ - Step 3706: {'lr': 0.0004998362852955918, 'samples': 711552, 'steps': 3705, 'loss/train': 2.3700718879699707} +11/06/2021 21:47:02 - INFO - __main__ - Step 3707: {'lr': 0.0004998360932195593, 'samples': 711744, 'steps': 3706, 'loss/train': 2.2039358615875244} +11/06/2021 21:47:02 - INFO - __main__ - Step 3708: {'lr': 0.0004998359010309544, 'samples': 711936, 'steps': 3707, 'loss/train': 2.483283758163452} +11/06/2021 21:47:03 - INFO - __main__ - Step 3709: {'lr': 0.0004998357087297775, 'samples': 712128, 'steps': 3708, 'loss/train': 1.5728569030761719} +11/06/2021 21:47:03 - INFO - __main__ - Step 3710: {'lr': 0.0004998355163160285, 'samples': 712320, 'steps': 3709, 'loss/train': 1.6009992361068726} +11/06/2021 21:47:04 - INFO - __main__ - Step 3711: {'lr': 0.0004998353237897073, 'samples': 712512, 'steps': 3710, 'loss/train': 2.459540605545044} +11/06/2021 21:47:04 - INFO - __main__ - Step 3712: {'lr': 0.0004998351311508143, 'samples': 712704, 'steps': 3711, 'loss/train': 1.7308366298675537} +11/06/2021 21:47:05 - INFO - __main__ - Step 3713: {'lr': 0.0004998349383993493, 'samples': 712896, 'steps': 3712, 'loss/train': 2.191849708557129} +11/06/2021 21:47:05 - INFO - __main__ - Step 3714: {'lr': 0.0004998347455353126, 'samples': 713088, 'steps': 3713, 'loss/train': 2.918881893157959} +11/06/2021 21:47:05 - INFO - __main__ - Step 3715: {'lr': 0.0004998345525587042, 'samples': 713280, 'steps': 3714, 'loss/train': 2.113539695739746} +11/06/2021 21:47:06 - INFO - __main__ - Step 3716: {'lr': 0.0004998343594695242, 'samples': 713472, 'steps': 3715, 'loss/train': 1.7858660221099854} +11/06/2021 21:47:07 - INFO - __main__ - Step 3717: {'lr': 0.0004998341662677728, 'samples': 713664, 'steps': 3716, 'loss/train': 1.8981730937957764} +11/06/2021 21:47:07 - INFO - __main__ - Step 3718: {'lr': 0.0004998339729534499, 'samples': 713856, 'steps': 3717, 'loss/train': 2.5536508560180664} +11/06/2021 21:47:07 - INFO - __main__ - Step 3719: {'lr': 0.0004998337795265557, 'samples': 714048, 'steps': 3718, 'loss/train': 2.2563905715942383} +11/06/2021 21:47:08 - INFO - __main__ - Step 3720: {'lr': 0.0004998335859870903, 'samples': 714240, 'steps': 3719, 'loss/train': 1.7998706102371216} +11/06/2021 21:47:09 - INFO - __main__ - Step 3721: {'lr': 0.0004998333923350536, 'samples': 714432, 'steps': 3720, 'loss/train': 2.0226428508758545} +11/06/2021 21:47:09 - INFO - __main__ - Step 3722: {'lr': 0.000499833198570446, 'samples': 714624, 'steps': 3721, 'loss/train': 1.3011538982391357} +11/06/2021 21:47:10 - INFO - __main__ - Step 3723: {'lr': 0.0004998330046932672, 'samples': 714816, 'steps': 3722, 'loss/train': 2.5336453914642334} +11/06/2021 21:47:10 - INFO - __main__ - Step 3724: {'lr': 0.0004998328107035176, 'samples': 715008, 'steps': 3723, 'loss/train': 2.392589807510376} +11/06/2021 21:47:10 - INFO - __main__ - Step 3725: {'lr': 0.0004998326166011973, 'samples': 715200, 'steps': 3724, 'loss/train': 2.1815335750579834} +11/06/2021 21:47:11 - INFO - __main__ - Step 3726: {'lr': 0.0004998324223863061, 'samples': 715392, 'steps': 3725, 'loss/train': 6.898614406585693} +11/06/2021 21:47:12 - INFO - __main__ - Step 3727: {'lr': 0.0004998322280588445, 'samples': 715584, 'steps': 3726, 'loss/train': 1.5503253936767578} +11/06/2021 21:47:12 - INFO - __main__ - Step 3728: {'lr': 0.0004998320336188121, 'samples': 715776, 'steps': 3727, 'loss/train': 2.2275030612945557} +11/06/2021 21:47:12 - INFO - __main__ - Step 3729: {'lr': 0.0004998318390662095, 'samples': 715968, 'steps': 3728, 'loss/train': 1.9741984605789185} +11/06/2021 21:47:13 - INFO - __main__ - Step 3730: {'lr': 0.0004998316444010363, 'samples': 716160, 'steps': 3729, 'loss/train': 1.3006471395492554} +11/06/2021 21:47:13 - INFO - __main__ - Step 3731: {'lr': 0.0004998314496232929, 'samples': 716352, 'steps': 3730, 'loss/train': 2.1504995822906494} +11/06/2021 21:47:14 - INFO - __main__ - Step 3732: {'lr': 0.0004998312547329793, 'samples': 716544, 'steps': 3731, 'loss/train': 2.3918561935424805} +11/06/2021 21:47:14 - INFO - __main__ - Step 3733: {'lr': 0.0004998310597300956, 'samples': 716736, 'steps': 3732, 'loss/train': 2.505441665649414} +11/06/2021 21:47:15 - INFO - __main__ - Step 3734: {'lr': 0.0004998308646146419, 'samples': 716928, 'steps': 3733, 'loss/train': 1.6491429805755615} +11/06/2021 21:47:15 - INFO - __main__ - Step 3735: {'lr': 0.0004998306693866181, 'samples': 717120, 'steps': 3734, 'loss/train': 2.3682384490966797} +11/06/2021 21:47:15 - INFO - __main__ - Step 3736: {'lr': 0.0004998304740460247, 'samples': 717312, 'steps': 3735, 'loss/train': 1.748855471611023} +11/06/2021 21:47:16 - INFO - __main__ - Step 3737: {'lr': 0.0004998302785928614, 'samples': 717504, 'steps': 3736, 'loss/train': 3.4032115936279297} +11/06/2021 21:47:17 - INFO - __main__ - Step 3738: {'lr': 0.0004998300830271285, 'samples': 717696, 'steps': 3737, 'loss/train': 2.2181355953216553} +11/06/2021 21:47:17 - INFO - __main__ - Step 3739: {'lr': 0.000499829887348826, 'samples': 717888, 'steps': 3738, 'loss/train': 2.0063092708587646} +11/06/2021 21:47:17 - INFO - __main__ - Step 3740: {'lr': 0.0004998296915579539, 'samples': 718080, 'steps': 3739, 'loss/train': 2.2116055488586426} +11/06/2021 21:47:18 - INFO - __main__ - Step 3741: {'lr': 0.0004998294956545125, 'samples': 718272, 'steps': 3740, 'loss/train': 2.458434820175171} +11/06/2021 21:47:19 - INFO - __main__ - Step 3742: {'lr': 0.0004998292996385019, 'samples': 718464, 'steps': 3741, 'loss/train': 2.001145839691162} +11/06/2021 21:47:19 - INFO - __main__ - Step 3743: {'lr': 0.0004998291035099219, 'samples': 718656, 'steps': 3742, 'loss/train': 1.889823079109192} +11/06/2021 21:47:20 - INFO - __main__ - Step 3744: {'lr': 0.0004998289072687728, 'samples': 718848, 'steps': 3743, 'loss/train': 2.2206709384918213} +11/06/2021 21:47:20 - INFO - __main__ - Step 3745: {'lr': 0.0004998287109150547, 'samples': 719040, 'steps': 3744, 'loss/train': 1.8798199892044067} +11/06/2021 21:47:20 - INFO - __main__ - Step 3746: {'lr': 0.0004998285144487676, 'samples': 719232, 'steps': 3745, 'loss/train': 2.057377576828003} +11/06/2021 21:47:21 - INFO - __main__ - Step 3747: {'lr': 0.0004998283178699116, 'samples': 719424, 'steps': 3746, 'loss/train': 1.8531581163406372} +11/06/2021 21:47:22 - INFO - __main__ - Step 3748: {'lr': 0.0004998281211784869, 'samples': 719616, 'steps': 3747, 'loss/train': 2.3435657024383545} +11/06/2021 21:47:22 - INFO - __main__ - Step 3749: {'lr': 0.0004998279243744934, 'samples': 719808, 'steps': 3748, 'loss/train': 2.2125914096832275} +11/06/2021 21:47:22 - INFO - __main__ - Step 3750: {'lr': 0.0004998277274579313, 'samples': 720000, 'steps': 3749, 'loss/train': 2.172743558883667} +11/06/2021 21:47:23 - INFO - __main__ - Step 3751: {'lr': 0.0004998275304288007, 'samples': 720192, 'steps': 3750, 'loss/train': 1.698510766029358} +11/06/2021 21:47:24 - INFO - __main__ - Step 3752: {'lr': 0.0004998273332871017, 'samples': 720384, 'steps': 3751, 'loss/train': 2.1584572792053223} +11/06/2021 21:47:24 - INFO - __main__ - Step 3753: {'lr': 0.0004998271360328344, 'samples': 720576, 'steps': 3752, 'loss/train': 1.8731579780578613} +11/06/2021 21:47:24 - INFO - __main__ - Step 3754: {'lr': 0.0004998269386659988, 'samples': 720768, 'steps': 3753, 'loss/train': 2.281588077545166} +11/06/2021 21:47:25 - INFO - __main__ - Step 3755: {'lr': 0.000499826741186595, 'samples': 720960, 'steps': 3754, 'loss/train': 2.172957420349121} +11/06/2021 21:47:25 - INFO - __main__ - Step 3756: {'lr': 0.0004998265435946232, 'samples': 721152, 'steps': 3755, 'loss/train': 2.0597519874572754} +11/06/2021 21:47:26 - INFO - __main__ - Step 3757: {'lr': 0.0004998263458900833, 'samples': 721344, 'steps': 3756, 'loss/train': 1.874323844909668} +11/06/2021 21:47:26 - INFO - __main__ - Step 3758: {'lr': 0.0004998261480729755, 'samples': 721536, 'steps': 3757, 'loss/train': 2.4779069423675537} +11/06/2021 21:47:27 - INFO - __main__ - Step 3759: {'lr': 0.0004998259501433, 'samples': 721728, 'steps': 3758, 'loss/train': 2.595695734024048} +11/06/2021 21:47:27 - INFO - __main__ - Step 3760: {'lr': 0.0004998257521010567, 'samples': 721920, 'steps': 3759, 'loss/train': 2.313114643096924} +11/06/2021 21:47:27 - INFO - __main__ - Step 3761: {'lr': 0.0004998255539462459, 'samples': 722112, 'steps': 3760, 'loss/train': 1.7417014837265015} +11/06/2021 21:47:28 - INFO - __main__ - Step 3762: {'lr': 0.0004998253556788675, 'samples': 722304, 'steps': 3761, 'loss/train': 2.088002920150757} +11/06/2021 21:47:29 - INFO - __main__ - Step 3763: {'lr': 0.0004998251572989217, 'samples': 722496, 'steps': 3762, 'loss/train': 2.2535784244537354} +11/06/2021 21:47:29 - INFO - __main__ - Step 3764: {'lr': 0.0004998249588064085, 'samples': 722688, 'steps': 3763, 'loss/train': 1.551037073135376} +11/06/2021 21:47:30 - INFO - __main__ - Step 3765: {'lr': 0.0004998247602013278, 'samples': 722880, 'steps': 3764, 'loss/train': 2.5815794467926025} +11/06/2021 21:47:30 - INFO - __main__ - Step 3766: {'lr': 0.0004998245614836802, 'samples': 723072, 'steps': 3765, 'loss/train': 2.278775930404663} +11/06/2021 21:47:30 - INFO - __main__ - Step 3767: {'lr': 0.0004998243626534655, 'samples': 723264, 'steps': 3766, 'loss/train': 2.4035115242004395} +11/06/2021 21:47:31 - INFO - __main__ - Step 3768: {'lr': 0.0004998241637106836, 'samples': 723456, 'steps': 3767, 'loss/train': 2.4984121322631836} +11/06/2021 21:47:32 - INFO - __main__ - Step 3769: {'lr': 0.0004998239646553349, 'samples': 723648, 'steps': 3768, 'loss/train': 1.8377968072891235} +11/06/2021 21:47:32 - INFO - __main__ - Step 3770: {'lr': 0.0004998237654874195, 'samples': 723840, 'steps': 3769, 'loss/train': 2.3453054428100586} +11/06/2021 21:47:32 - INFO - __main__ - Step 3771: {'lr': 0.0004998235662069372, 'samples': 724032, 'steps': 3770, 'loss/train': 1.7649283409118652} +11/06/2021 21:47:33 - INFO - __main__ - Step 3772: {'lr': 0.0004998233668138883, 'samples': 724224, 'steps': 3771, 'loss/train': 1.8481817245483398} +11/06/2021 21:47:34 - INFO - __main__ - Step 3773: {'lr': 0.0004998231673082729, 'samples': 724416, 'steps': 3772, 'loss/train': 2.0594215393066406} +11/06/2021 21:47:34 - INFO - __main__ - Step 3774: {'lr': 0.000499822967690091, 'samples': 724608, 'steps': 3773, 'loss/train': 2.3945000171661377} +11/06/2021 21:47:35 - INFO - __main__ - Step 3775: {'lr': 0.0004998227679593426, 'samples': 724800, 'steps': 3774, 'loss/train': 1.9772299528121948} +11/06/2021 21:47:35 - INFO - __main__ - Step 3776: {'lr': 0.0004998225681160281, 'samples': 724992, 'steps': 3775, 'loss/train': 1.82159423828125} +11/06/2021 21:47:35 - INFO - __main__ - Step 3777: {'lr': 0.0004998223681601474, 'samples': 725184, 'steps': 3776, 'loss/train': 2.3857104778289795} +11/06/2021 21:47:36 - INFO - __main__ - Step 3778: {'lr': 0.0004998221680917004, 'samples': 725376, 'steps': 3777, 'loss/train': 2.202800989151001} +11/06/2021 21:47:37 - INFO - __main__ - Step 3779: {'lr': 0.0004998219679106876, 'samples': 725568, 'steps': 3778, 'loss/train': 2.383378028869629} +11/06/2021 21:47:37 - INFO - __main__ - Step 3780: {'lr': 0.0004998217676171088, 'samples': 725760, 'steps': 3779, 'loss/train': 2.38877010345459} +11/06/2021 21:47:37 - INFO - __main__ - Step 3781: {'lr': 0.0004998215672109641, 'samples': 725952, 'steps': 3780, 'loss/train': 2.0370190143585205} +11/06/2021 21:47:38 - INFO - __main__ - Step 3782: {'lr': 0.0004998213666922537, 'samples': 726144, 'steps': 3781, 'loss/train': 1.9329248666763306} +11/06/2021 21:47:39 - INFO - __main__ - Step 3783: {'lr': 0.0004998211660609777, 'samples': 726336, 'steps': 3782, 'loss/train': 3.1192450523376465} +11/06/2021 21:47:39 - INFO - __main__ - Step 3784: {'lr': 0.0004998209653171361, 'samples': 726528, 'steps': 3783, 'loss/train': 0.4665497839450836} +11/06/2021 21:47:39 - INFO - __main__ - Step 3785: {'lr': 0.0004998207644607291, 'samples': 726720, 'steps': 3784, 'loss/train': 2.076326370239258} +11/06/2021 21:47:40 - INFO - __main__ - Step 3786: {'lr': 0.0004998205634917566, 'samples': 726912, 'steps': 3785, 'loss/train': 2.1383769512176514} +11/06/2021 21:47:40 - INFO - __main__ - Step 3787: {'lr': 0.0004998203624102188, 'samples': 727104, 'steps': 3786, 'loss/train': 2.3829987049102783} +11/06/2021 21:47:41 - INFO - __main__ - Step 3788: {'lr': 0.0004998201612161159, 'samples': 727296, 'steps': 3787, 'loss/train': 1.7519925832748413} +11/06/2021 21:47:42 - INFO - __main__ - Step 3789: {'lr': 0.0004998199599094478, 'samples': 727488, 'steps': 3788, 'loss/train': 1.9867311716079712} +11/06/2021 21:47:42 - INFO - __main__ - Step 3790: {'lr': 0.0004998197584902147, 'samples': 727680, 'steps': 3789, 'loss/train': 1.7998645305633545} +11/06/2021 21:47:42 - INFO - __main__ - Step 3791: {'lr': 0.0004998195569584168, 'samples': 727872, 'steps': 3790, 'loss/train': 2.279456377029419} +11/06/2021 21:47:43 - INFO - __main__ - Step 3792: {'lr': 0.0004998193553140539, 'samples': 728064, 'steps': 3791, 'loss/train': 1.8781626224517822} +11/06/2021 21:47:44 - INFO - __main__ - Step 3793: {'lr': 0.0004998191535571264, 'samples': 728256, 'steps': 3792, 'loss/train': 2.181241750717163} +11/06/2021 21:47:44 - INFO - __main__ - Step 3794: {'lr': 0.0004998189516876342, 'samples': 728448, 'steps': 3793, 'loss/train': 2.345247983932495} +11/06/2021 21:47:44 - INFO - __main__ - Step 3795: {'lr': 0.0004998187497055773, 'samples': 728640, 'steps': 3794, 'loss/train': 0.6545143723487854} +11/06/2021 21:47:45 - INFO - __main__ - Step 3796: {'lr': 0.000499818547610956, 'samples': 728832, 'steps': 3795, 'loss/train': 1.8099079132080078} +11/06/2021 21:47:45 - INFO - __main__ - Step 3797: {'lr': 0.0004998183454037703, 'samples': 729024, 'steps': 3796, 'loss/train': 1.515761137008667} +11/06/2021 21:47:45 - INFO - __main__ - Step 3798: {'lr': 0.0004998181430840204, 'samples': 729216, 'steps': 3797, 'loss/train': 1.9123553037643433} +11/06/2021 21:47:46 - INFO - __main__ - Step 3799: {'lr': 0.0004998179406517063, 'samples': 729408, 'steps': 3798, 'loss/train': 1.983812689781189} +11/06/2021 21:47:47 - INFO - __main__ - Step 3800: {'lr': 0.000499817738106828, 'samples': 729600, 'steps': 3799, 'loss/train': 5.782630920410156} +11/06/2021 21:47:47 - INFO - __main__ - Step 3801: {'lr': 0.0004998175354493857, 'samples': 729792, 'steps': 3800, 'loss/train': 1.7894034385681152} +11/06/2021 21:47:47 - INFO - __main__ - Step 3802: {'lr': 0.0004998173326793795, 'samples': 729984, 'steps': 3801, 'loss/train': 1.8084430694580078} +11/06/2021 21:47:48 - INFO - __main__ - Step 3803: {'lr': 0.0004998171297968095, 'samples': 730176, 'steps': 3802, 'loss/train': 2.3628175258636475} +11/06/2021 21:47:49 - INFO - __main__ - Step 3804: {'lr': 0.0004998169268016757, 'samples': 730368, 'steps': 3803, 'loss/train': 2.064181089401245} +11/06/2021 21:47:49 - INFO - __main__ - Step 3805: {'lr': 0.0004998167236939783, 'samples': 730560, 'steps': 3804, 'loss/train': 2.378023147583008} +11/06/2021 21:47:50 - INFO - __main__ - Step 3806: {'lr': 0.0004998165204737173, 'samples': 730752, 'steps': 3805, 'loss/train': 1.9755092859268188} +11/06/2021 21:47:50 - INFO - __main__ - Step 3807: {'lr': 0.0004998163171408928, 'samples': 730944, 'steps': 3806, 'loss/train': 2.0892038345336914} +11/06/2021 21:47:50 - INFO - __main__ - Step 3808: {'lr': 0.000499816113695505, 'samples': 731136, 'steps': 3807, 'loss/train': 2.038058042526245} +11/06/2021 21:47:52 - INFO - __main__ - Step 3809: {'lr': 0.0004998159101375538, 'samples': 731328, 'steps': 3808, 'loss/train': 2.4071855545043945} +11/06/2021 21:47:52 - INFO - __main__ - Step 3810: {'lr': 0.0004998157064670395, 'samples': 731520, 'steps': 3809, 'loss/train': 1.957269549369812} +11/06/2021 21:47:52 - INFO - __main__ - Step 3811: {'lr': 0.0004998155026839621, 'samples': 731712, 'steps': 3810, 'loss/train': 1.6153275966644287} +11/06/2021 21:47:53 - INFO - __main__ - Step 3812: {'lr': 0.0004998152987883217, 'samples': 731904, 'steps': 3811, 'loss/train': 1.7951699495315552} +11/06/2021 21:47:53 - INFO - __main__ - Step 3813: {'lr': 0.0004998150947801182, 'samples': 732096, 'steps': 3812, 'loss/train': 1.9503369331359863} +11/06/2021 21:47:54 - INFO - __main__ - Step 3814: {'lr': 0.000499814890659352, 'samples': 732288, 'steps': 3813, 'loss/train': 1.8731478452682495} +11/06/2021 21:47:55 - INFO - __main__ - Step 3815: {'lr': 0.0004998146864260231, 'samples': 732480, 'steps': 3814, 'loss/train': 2.178349733352661} +11/06/2021 21:47:55 - INFO - __main__ - Step 3816: {'lr': 0.0004998144820801316, 'samples': 732672, 'steps': 3815, 'loss/train': 2.257465124130249} +11/06/2021 21:47:55 - INFO - __main__ - Step 3817: {'lr': 0.0004998142776216775, 'samples': 732864, 'steps': 3816, 'loss/train': 2.292968988418579} +11/06/2021 21:47:56 - INFO - __main__ - Step 3818: {'lr': 0.0004998140730506609, 'samples': 733056, 'steps': 3817, 'loss/train': 1.7161427736282349} +11/06/2021 21:47:56 - INFO - __main__ - Step 3819: {'lr': 0.000499813868367082, 'samples': 733248, 'steps': 3818, 'loss/train': 1.899258017539978} +11/06/2021 21:47:57 - INFO - __main__ - Step 3820: {'lr': 0.0004998136635709408, 'samples': 733440, 'steps': 3819, 'loss/train': 2.3737716674804688} +11/06/2021 21:47:57 - INFO - __main__ - Step 3821: {'lr': 0.0004998134586622374, 'samples': 733632, 'steps': 3820, 'loss/train': 2.9889981746673584} +11/06/2021 21:47:58 - INFO - __main__ - Step 3822: {'lr': 0.0004998132536409718, 'samples': 733824, 'steps': 3821, 'loss/train': 1.6760238409042358} +11/06/2021 21:47:58 - INFO - __main__ - Step 3823: {'lr': 0.0004998130485071444, 'samples': 734016, 'steps': 3822, 'loss/train': 2.2223479747772217} +11/06/2021 21:47:58 - INFO - __main__ - Step 3824: {'lr': 0.000499812843260755, 'samples': 734208, 'steps': 3823, 'loss/train': 2.103163480758667} +11/06/2021 21:47:59 - INFO - __main__ - Step 3825: {'lr': 0.0004998126379018038, 'samples': 734400, 'steps': 3824, 'loss/train': 1.4351319074630737} +11/06/2021 21:48:00 - INFO - __main__ - Step 3826: {'lr': 0.000499812432430291, 'samples': 734592, 'steps': 3825, 'loss/train': 2.600419282913208} +11/06/2021 21:48:00 - INFO - __main__ - Step 3827: {'lr': 0.0004998122268462164, 'samples': 734784, 'steps': 3826, 'loss/train': 1.890721082687378} +11/06/2021 21:48:00 - INFO - __main__ - Step 3828: {'lr': 0.0004998120211495803, 'samples': 734976, 'steps': 3827, 'loss/train': 1.8643083572387695} +11/06/2021 21:48:01 - INFO - __main__ - Step 3829: {'lr': 0.0004998118153403827, 'samples': 735168, 'steps': 3828, 'loss/train': 2.375256299972534} +11/06/2021 21:48:02 - INFO - __main__ - Step 3830: {'lr': 0.0004998116094186239, 'samples': 735360, 'steps': 3829, 'loss/train': 1.937308430671692} +11/06/2021 21:48:02 - INFO - __main__ - Step 3831: {'lr': 0.0004998114033843038, 'samples': 735552, 'steps': 3830, 'loss/train': 2.2312798500061035} +11/06/2021 21:48:03 - INFO - __main__ - Step 3832: {'lr': 0.0004998111972374225, 'samples': 735744, 'steps': 3831, 'loss/train': 2.345470905303955} +11/06/2021 21:48:03 - INFO - __main__ - Step 3833: {'lr': 0.0004998109909779801, 'samples': 735936, 'steps': 3832, 'loss/train': 2.126286745071411} +11/06/2021 21:48:03 - INFO - __main__ - Step 3834: {'lr': 0.0004998107846059768, 'samples': 736128, 'steps': 3833, 'loss/train': 2.274366855621338} +11/06/2021 21:48:04 - INFO - __main__ - Step 3835: {'lr': 0.0004998105781214126, 'samples': 736320, 'steps': 3834, 'loss/train': 2.0822598934173584} +11/06/2021 21:48:05 - INFO - __main__ - Step 3836: {'lr': 0.0004998103715242875, 'samples': 736512, 'steps': 3835, 'loss/train': 2.376988649368286} +11/06/2021 21:48:05 - INFO - __main__ - Step 3837: {'lr': 0.0004998101648146018, 'samples': 736704, 'steps': 3836, 'loss/train': 2.1825759410858154} +11/06/2021 21:48:05 - INFO - __main__ - Step 3838: {'lr': 0.0004998099579923555, 'samples': 736896, 'steps': 3837, 'loss/train': 2.2881062030792236} +11/06/2021 21:48:06 - INFO - __main__ - Step 3839: {'lr': 0.0004998097510575487, 'samples': 737088, 'steps': 3838, 'loss/train': 2.04844069480896} +11/06/2021 21:48:06 - INFO - __main__ - Step 3840: {'lr': 0.0004998095440101815, 'samples': 737280, 'steps': 3839, 'loss/train': 2.203437089920044} +11/06/2021 21:48:07 - INFO - __main__ - Step 3841: {'lr': 0.0004998093368502539, 'samples': 737472, 'steps': 3840, 'loss/train': 2.4474103450775146} +11/06/2021 21:48:07 - INFO - __main__ - Step 3842: {'lr': 0.000499809129577766, 'samples': 737664, 'steps': 3841, 'loss/train': 1.3475080728530884} +11/06/2021 21:48:08 - INFO - __main__ - Step 3843: {'lr': 0.0004998089221927182, 'samples': 737856, 'steps': 3842, 'loss/train': 6.6313982009887695} +11/06/2021 21:48:08 - INFO - __main__ - Step 3844: {'lr': 0.0004998087146951101, 'samples': 738048, 'steps': 3843, 'loss/train': 0.9520333409309387} +11/06/2021 21:48:09 - INFO - __main__ - Step 3845: {'lr': 0.0004998085070849422, 'samples': 738240, 'steps': 3844, 'loss/train': 2.355161428451538} +11/06/2021 21:48:09 - INFO - __main__ - Step 3846: {'lr': 0.0004998082993622144, 'samples': 738432, 'steps': 3845, 'loss/train': 1.7078429460525513} +11/06/2021 21:48:10 - INFO - __main__ - Step 3847: {'lr': 0.0004998080915269268, 'samples': 738624, 'steps': 3846, 'loss/train': 1.6196483373641968} +11/06/2021 21:48:10 - INFO - __main__ - Step 3848: {'lr': 0.0004998078835790796, 'samples': 738816, 'steps': 3847, 'loss/train': 1.4258253574371338} +11/06/2021 21:48:11 - INFO - __main__ - Step 3849: {'lr': 0.0004998076755186727, 'samples': 739008, 'steps': 3848, 'loss/train': 1.7136802673339844} +11/06/2021 21:48:11 - INFO - __main__ - Step 3850: {'lr': 0.0004998074673457064, 'samples': 739200, 'steps': 3849, 'loss/train': 2.093299627304077} +11/06/2021 21:48:12 - INFO - __main__ - Step 3851: {'lr': 0.0004998072590601808, 'samples': 739392, 'steps': 3850, 'loss/train': 1.7674520015716553} +11/06/2021 21:48:12 - INFO - __main__ - Step 3852: {'lr': 0.0004998070506620957, 'samples': 739584, 'steps': 3851, 'loss/train': 2.6275033950805664} +11/06/2021 21:48:13 - INFO - __main__ - Step 3853: {'lr': 0.0004998068421514515, 'samples': 739776, 'steps': 3852, 'loss/train': 1.4663965702056885} +11/06/2021 21:48:13 - INFO - __main__ - Step 3854: {'lr': 0.0004998066335282483, 'samples': 739968, 'steps': 3853, 'loss/train': 1.9457613229751587} +11/06/2021 21:48:13 - INFO - __main__ - Step 3855: {'lr': 0.0004998064247924859, 'samples': 740160, 'steps': 3854, 'loss/train': 2.18340802192688} +11/06/2021 21:48:14 - INFO - __main__ - Step 3856: {'lr': 0.0004998062159441648, 'samples': 740352, 'steps': 3855, 'loss/train': 2.0008771419525146} +11/06/2021 21:48:15 - INFO - __main__ - Step 3857: {'lr': 0.0004998060069832846, 'samples': 740544, 'steps': 3856, 'loss/train': 1.8760361671447754} +11/06/2021 21:48:15 - INFO - __main__ - Step 3858: {'lr': 0.0004998057979098459, 'samples': 740736, 'steps': 3857, 'loss/train': 2.1014292240142822} +11/06/2021 21:48:15 - INFO - __main__ - Step 3859: {'lr': 0.0004998055887238485, 'samples': 740928, 'steps': 3858, 'loss/train': 1.7220332622528076} +11/06/2021 21:48:16 - INFO - __main__ - Step 3860: {'lr': 0.0004998053794252925, 'samples': 741120, 'steps': 3859, 'loss/train': 1.1343226432800293} +11/06/2021 21:48:16 - INFO - __main__ - Step 3861: {'lr': 0.0004998051700141781, 'samples': 741312, 'steps': 3860, 'loss/train': 1.9412497282028198} +11/06/2021 21:48:17 - INFO - __main__ - Step 3862: {'lr': 0.0004998049604905052, 'samples': 741504, 'steps': 3861, 'loss/train': 2.0013692378997803} +11/06/2021 21:48:17 - INFO - __main__ - Step 3863: {'lr': 0.0004998047508542742, 'samples': 741696, 'steps': 3862, 'loss/train': 2.296785593032837} +11/06/2021 21:48:18 - INFO - __main__ - Step 3864: {'lr': 0.000499804541105485, 'samples': 741888, 'steps': 3863, 'loss/train': 2.1500766277313232} +11/06/2021 21:48:18 - INFO - __main__ - Step 3865: {'lr': 0.0004998043312441378, 'samples': 742080, 'steps': 3864, 'loss/train': 2.002265214920044} +11/06/2021 21:48:18 - INFO - __main__ - Step 3866: {'lr': 0.0004998041212702325, 'samples': 742272, 'steps': 3865, 'loss/train': 1.9484808444976807} +11/06/2021 21:48:20 - INFO - __main__ - Step 3867: {'lr': 0.0004998039111837694, 'samples': 742464, 'steps': 3866, 'loss/train': 2.214564323425293} +11/06/2021 21:48:20 - INFO - __main__ - Step 3868: {'lr': 0.0004998037009847485, 'samples': 742656, 'steps': 3867, 'loss/train': 2.071249485015869} +11/06/2021 21:48:20 - INFO - __main__ - Step 3869: {'lr': 0.0004998034906731699, 'samples': 742848, 'steps': 3868, 'loss/train': 1.7390302419662476} +11/06/2021 21:48:21 - INFO - __main__ - Step 3870: {'lr': 0.0004998032802490337, 'samples': 743040, 'steps': 3869, 'loss/train': 1.92386794090271} +11/06/2021 21:48:21 - INFO - __main__ - Step 3871: {'lr': 0.0004998030697123399, 'samples': 743232, 'steps': 3870, 'loss/train': 2.0642926692962646} +11/06/2021 21:48:22 - INFO - __main__ - Step 3872: {'lr': 0.0004998028590630887, 'samples': 743424, 'steps': 3871, 'loss/train': 2.2832822799682617} +11/06/2021 21:48:22 - INFO - __main__ - Step 3873: {'lr': 0.0004998026483012803, 'samples': 743616, 'steps': 3872, 'loss/train': 0.3874906599521637} +11/06/2021 21:48:23 - INFO - __main__ - Step 3874: {'lr': 0.0004998024374269147, 'samples': 743808, 'steps': 3873, 'loss/train': 1.9504804611206055} +11/06/2021 21:48:23 - INFO - __main__ - Step 3875: {'lr': 0.000499802226439992, 'samples': 744000, 'steps': 3874, 'loss/train': 1.7076032161712646} +11/06/2021 21:48:23 - INFO - __main__ - Step 3876: {'lr': 0.0004998020153405121, 'samples': 744192, 'steps': 3875, 'loss/train': 2.5436949729919434} +11/06/2021 21:48:25 - INFO - __main__ - Step 3877: {'lr': 0.0004998018041284754, 'samples': 744384, 'steps': 3876, 'loss/train': 1.7179841995239258} +11/06/2021 21:48:25 - INFO - __main__ - Step 3878: {'lr': 0.0004998015928038819, 'samples': 744576, 'steps': 3877, 'loss/train': 1.9025819301605225} +11/06/2021 21:48:25 - INFO - __main__ - Step 3879: {'lr': 0.0004998013813667315, 'samples': 744768, 'steps': 3878, 'loss/train': 6.284189701080322} +11/06/2021 21:48:26 - INFO - __main__ - Step 3880: {'lr': 0.0004998011698170245, 'samples': 744960, 'steps': 3879, 'loss/train': 2.270320415496826} +11/06/2021 21:48:26 - INFO - __main__ - Step 3881: {'lr': 0.000499800958154761, 'samples': 745152, 'steps': 3880, 'loss/train': 1.9726059436798096} +11/06/2021 21:48:27 - INFO - __main__ - Step 3882: {'lr': 0.000499800746379941, 'samples': 745344, 'steps': 3881, 'loss/train': 2.072402000427246} +11/06/2021 21:48:28 - INFO - __main__ - Step 3883: {'lr': 0.0004998005344925647, 'samples': 745536, 'steps': 3882, 'loss/train': 1.0873523950576782} +11/06/2021 21:48:28 - INFO - __main__ - Step 3884: {'lr': 0.0004998003224926321, 'samples': 745728, 'steps': 3883, 'loss/train': 1.970503807067871} +11/06/2021 21:48:29 - INFO - __main__ - Step 3885: {'lr': 0.0004998001103801433, 'samples': 745920, 'steps': 3884, 'loss/train': 2.3565833568573} +11/06/2021 21:48:29 - INFO - __main__ - Step 3886: {'lr': 0.0004997998981550985, 'samples': 746112, 'steps': 3885, 'loss/train': 1.7249259948730469} +11/06/2021 21:48:29 - INFO - __main__ - Step 3887: {'lr': 0.0004997996858174976, 'samples': 746304, 'steps': 3886, 'loss/train': 2.158630132675171} +11/06/2021 21:48:30 - INFO - __main__ - Step 3888: {'lr': 0.0004997994733673409, 'samples': 746496, 'steps': 3887, 'loss/train': 2.0216381549835205} +11/06/2021 21:48:31 - INFO - __main__ - Step 3889: {'lr': 0.0004997992608046283, 'samples': 746688, 'steps': 3888, 'loss/train': 2.1885178089141846} +11/06/2021 21:48:31 - INFO - __main__ - Step 3890: {'lr': 0.0004997990481293602, 'samples': 746880, 'steps': 3889, 'loss/train': 2.567704916000366} +11/06/2021 21:48:31 - INFO - __main__ - Step 3891: {'lr': 0.0004997988353415364, 'samples': 747072, 'steps': 3890, 'loss/train': 2.117457389831543} +11/06/2021 21:48:32 - INFO - __main__ - Step 3892: {'lr': 0.0004997986224411571, 'samples': 747264, 'steps': 3891, 'loss/train': 1.900480031967163} +11/06/2021 21:48:32 - INFO - __main__ - Step 3893: {'lr': 0.0004997984094282224, 'samples': 747456, 'steps': 3892, 'loss/train': 1.8909573554992676} +11/06/2021 21:48:33 - INFO - __main__ - Step 3894: {'lr': 0.0004997981963027324, 'samples': 747648, 'steps': 3893, 'loss/train': 2.2381651401519775} +11/06/2021 21:48:33 - INFO - __main__ - Step 3895: {'lr': 0.0004997979830646871, 'samples': 747840, 'steps': 3894, 'loss/train': 1.9018830060958862} +11/06/2021 21:48:34 - INFO - __main__ - Step 3896: {'lr': 0.0004997977697140868, 'samples': 748032, 'steps': 3895, 'loss/train': 4.09332799911499} +11/06/2021 21:48:34 - INFO - __main__ - Step 3897: {'lr': 0.0004997975562509315, 'samples': 748224, 'steps': 3896, 'loss/train': 1.9882245063781738} +11/06/2021 21:48:34 - INFO - __main__ - Step 3898: {'lr': 0.0004997973426752212, 'samples': 748416, 'steps': 3897, 'loss/train': 2.2893571853637695} +11/06/2021 21:48:35 - INFO - __main__ - Step 3899: {'lr': 0.0004997971289869561, 'samples': 748608, 'steps': 3898, 'loss/train': 2.5305356979370117} +11/06/2021 21:48:36 - INFO - __main__ - Step 3900: {'lr': 0.0004997969151861362, 'samples': 748800, 'steps': 3899, 'loss/train': 1.9628640413284302} +11/06/2021 21:48:36 - INFO - __main__ - Step 3901: {'lr': 0.0004997967012727618, 'samples': 748992, 'steps': 3900, 'loss/train': 1.784785270690918} +11/06/2021 21:48:37 - INFO - __main__ - Step 3902: {'lr': 0.0004997964872468327, 'samples': 749184, 'steps': 3901, 'loss/train': 2.4843428134918213} +11/06/2021 21:48:37 - INFO - __main__ - Step 3903: {'lr': 0.0004997962731083492, 'samples': 749376, 'steps': 3902, 'loss/train': 2.3795173168182373} +11/06/2021 21:48:37 - INFO - __main__ - Step 3904: {'lr': 0.0004997960588573115, 'samples': 749568, 'steps': 3903, 'loss/train': 1.7460960149765015} +11/06/2021 21:48:38 - INFO - __main__ - Step 3905: {'lr': 0.0004997958444937193, 'samples': 749760, 'steps': 3904, 'loss/train': 2.3648343086242676} +11/06/2021 21:48:39 - INFO - __main__ - Step 3906: {'lr': 0.0004997956300175732, 'samples': 749952, 'steps': 3905, 'loss/train': 2.6430604457855225} +11/06/2021 21:48:39 - INFO - __main__ - Step 3907: {'lr': 0.000499795415428873, 'samples': 750144, 'steps': 3906, 'loss/train': 1.1248779296875} +11/06/2021 21:48:39 - INFO - __main__ - Step 3908: {'lr': 0.0004997952007276187, 'samples': 750336, 'steps': 3907, 'loss/train': 1.4855318069458008} +11/06/2021 21:48:40 - INFO - __main__ - Step 3909: {'lr': 0.0004997949859138106, 'samples': 750528, 'steps': 3908, 'loss/train': 2.541107177734375} +11/06/2021 21:48:41 - INFO - __main__ - Step 3910: {'lr': 0.0004997947709874487, 'samples': 750720, 'steps': 3909, 'loss/train': 2.4403843879699707} +11/06/2021 21:48:41 - INFO - __main__ - Step 3911: {'lr': 0.0004997945559485333, 'samples': 750912, 'steps': 3910, 'loss/train': 2.18257212638855} +11/06/2021 21:48:41 - INFO - __main__ - Step 3912: {'lr': 0.0004997943407970642, 'samples': 751104, 'steps': 3911, 'loss/train': 2.1708099842071533} +11/06/2021 21:48:42 - INFO - __main__ - Step 3913: {'lr': 0.0004997941255330416, 'samples': 751296, 'steps': 3912, 'loss/train': 1.9108836650848389} +11/06/2021 21:48:42 - INFO - __main__ - Step 3914: {'lr': 0.0004997939101564656, 'samples': 751488, 'steps': 3913, 'loss/train': 9.35435676574707} +11/06/2021 21:48:43 - INFO - __main__ - Step 3915: {'lr': 0.0004997936946673365, 'samples': 751680, 'steps': 3914, 'loss/train': 1.6310161352157593} +11/06/2021 21:48:44 - INFO - __main__ - Step 3916: {'lr': 0.000499793479065654, 'samples': 751872, 'steps': 3915, 'loss/train': 2.2418010234832764} +11/06/2021 21:48:44 - INFO - __main__ - Step 3917: {'lr': 0.0004997932633514185, 'samples': 752064, 'steps': 3916, 'loss/train': 2.000413417816162} +11/06/2021 21:48:44 - INFO - __main__ - Step 3918: {'lr': 0.00049979304752463, 'samples': 752256, 'steps': 3917, 'loss/train': 1.5085346698760986} +11/06/2021 21:48:45 - INFO - __main__ - Step 3919: {'lr': 0.0004997928315852887, 'samples': 752448, 'steps': 3918, 'loss/train': 2.0506739616394043} +11/06/2021 21:48:46 - INFO - __main__ - Step 3920: {'lr': 0.0004997926155333944, 'samples': 752640, 'steps': 3919, 'loss/train': 1.832281231880188} +11/06/2021 21:48:46 - INFO - __main__ - Step 3921: {'lr': 0.0004997923993689476, 'samples': 752832, 'steps': 3920, 'loss/train': 1.8612034320831299} +11/06/2021 21:48:46 - INFO - __main__ - Step 3922: {'lr': 0.0004997921830919481, 'samples': 753024, 'steps': 3921, 'loss/train': 0.8128635287284851} +11/06/2021 21:48:47 - INFO - __main__ - Step 3923: {'lr': 0.0004997919667023962, 'samples': 753216, 'steps': 3922, 'loss/train': 6.834549903869629} +11/06/2021 21:48:47 - INFO - __main__ - Step 3924: {'lr': 0.0004997917502002917, 'samples': 753408, 'steps': 3923, 'loss/train': 2.564049243927002} +11/06/2021 21:48:47 - INFO - __main__ - Step 3925: {'lr': 0.000499791533585635, 'samples': 753600, 'steps': 3924, 'loss/train': 1.4833868741989136} +11/06/2021 21:48:49 - INFO - __main__ - Step 3926: {'lr': 0.0004997913168584262, 'samples': 753792, 'steps': 3925, 'loss/train': 1.9561244249343872} +11/06/2021 21:48:49 - INFO - __main__ - Step 3927: {'lr': 0.0004997911000186651, 'samples': 753984, 'steps': 3926, 'loss/train': 2.2300021648406982} +11/06/2021 21:48:49 - INFO - __main__ - Step 3928: {'lr': 0.0004997908830663521, 'samples': 754176, 'steps': 3927, 'loss/train': 2.1345834732055664} +11/06/2021 21:48:50 - INFO - __main__ - Step 3929: {'lr': 0.0004997906660014871, 'samples': 754368, 'steps': 3928, 'loss/train': 1.8014755249023438} +11/06/2021 21:48:50 - INFO - __main__ - Step 3930: {'lr': 0.0004997904488240704, 'samples': 754560, 'steps': 3929, 'loss/train': 1.9056246280670166} +11/06/2021 21:48:51 - INFO - __main__ - Step 3931: {'lr': 0.0004997902315341019, 'samples': 754752, 'steps': 3930, 'loss/train': 2.0737431049346924} +11/06/2021 21:48:51 - INFO - __main__ - Step 3932: {'lr': 0.0004997900141315817, 'samples': 754944, 'steps': 3931, 'loss/train': 2.1492855548858643} +11/06/2021 21:48:52 - INFO - __main__ - Step 3933: {'lr': 0.0004997897966165101, 'samples': 755136, 'steps': 3932, 'loss/train': 1.6962233781814575} +11/06/2021 21:48:52 - INFO - __main__ - Step 3934: {'lr': 0.000499789578988887, 'samples': 755328, 'steps': 3933, 'loss/train': 2.532392740249634} +11/06/2021 21:48:52 - INFO - __main__ - Step 3935: {'lr': 0.0004997893612487126, 'samples': 755520, 'steps': 3934, 'loss/train': 2.003080368041992} +11/06/2021 21:48:53 - INFO - __main__ - Step 3936: {'lr': 0.000499789143395987, 'samples': 755712, 'steps': 3935, 'loss/train': 2.3303253650665283} +11/06/2021 21:48:54 - INFO - __main__ - Step 3937: {'lr': 0.0004997889254307103, 'samples': 755904, 'steps': 3936, 'loss/train': 2.4294395446777344} +11/06/2021 21:48:54 - INFO - __main__ - Step 3938: {'lr': 0.0004997887073528825, 'samples': 756096, 'steps': 3937, 'loss/train': 2.0944905281066895} +11/06/2021 21:48:54 - INFO - __main__ - Step 3939: {'lr': 0.0004997884891625037, 'samples': 756288, 'steps': 3938, 'loss/train': 2.200429916381836} +11/06/2021 21:48:55 - INFO - __main__ - Step 3940: {'lr': 0.0004997882708595742, 'samples': 756480, 'steps': 3939, 'loss/train': 1.588007926940918} +11/06/2021 21:48:55 - INFO - __main__ - Step 3941: {'lr': 0.0004997880524440939, 'samples': 756672, 'steps': 3940, 'loss/train': 2.470881700515747} +11/06/2021 21:48:56 - INFO - __main__ - Step 3942: {'lr': 0.0004997878339160628, 'samples': 756864, 'steps': 3941, 'loss/train': 2.125309705734253} +11/06/2021 21:48:56 - INFO - __main__ - Step 3943: {'lr': 0.0004997876152754814, 'samples': 757056, 'steps': 3942, 'loss/train': 1.4756630659103394} +11/06/2021 21:48:57 - INFO - __main__ - Step 3944: {'lr': 0.0004997873965223495, 'samples': 757248, 'steps': 3943, 'loss/train': 2.6807804107666016} +11/06/2021 21:48:57 - INFO - __main__ - Step 3945: {'lr': 0.0004997871776566672, 'samples': 757440, 'steps': 3944, 'loss/train': 2.2836551666259766} +11/06/2021 21:48:58 - INFO - __main__ - Step 3946: {'lr': 0.0004997869586784346, 'samples': 757632, 'steps': 3945, 'loss/train': 2.121295690536499} +11/06/2021 21:48:59 - INFO - __main__ - Step 3947: {'lr': 0.0004997867395876519, 'samples': 757824, 'steps': 3946, 'loss/train': 2.3428549766540527} +11/06/2021 21:48:59 - INFO - __main__ - Step 3948: {'lr': 0.0004997865203843192, 'samples': 758016, 'steps': 3947, 'loss/train': 1.777374267578125} +11/06/2021 21:48:59 - INFO - __main__ - Step 3949: {'lr': 0.0004997863010684365, 'samples': 758208, 'steps': 3948, 'loss/train': 0.35795682668685913} +11/06/2021 21:49:00 - INFO - __main__ - Step 3950: {'lr': 0.0004997860816400039, 'samples': 758400, 'steps': 3949, 'loss/train': 2.5950117111206055} +11/06/2021 21:49:00 - INFO - __main__ - Step 3951: {'lr': 0.0004997858620990217, 'samples': 758592, 'steps': 3950, 'loss/train': 1.9574391841888428} +11/06/2021 21:49:01 - INFO - __main__ - Step 3952: {'lr': 0.0004997856424454897, 'samples': 758784, 'steps': 3951, 'loss/train': 1.4650882482528687} +11/06/2021 21:49:02 - INFO - __main__ - Step 3953: {'lr': 0.0004997854226794082, 'samples': 758976, 'steps': 3952, 'loss/train': 2.324097156524658} +11/06/2021 21:49:02 - INFO - __main__ - Step 3954: {'lr': 0.0004997852028007772, 'samples': 759168, 'steps': 3953, 'loss/train': 1.7094135284423828} +11/06/2021 21:49:02 - INFO - __main__ - Step 3955: {'lr': 0.0004997849828095969, 'samples': 759360, 'steps': 3954, 'loss/train': 2.0461413860321045} +11/06/2021 21:49:03 - INFO - __main__ - Step 3956: {'lr': 0.0004997847627058673, 'samples': 759552, 'steps': 3955, 'loss/train': 1.8901828527450562} +11/06/2021 21:49:04 - INFO - __main__ - Step 3957: {'lr': 0.0004997845424895886, 'samples': 759744, 'steps': 3956, 'loss/train': 2.1595001220703125} +11/06/2021 21:49:04 - INFO - __main__ - Step 3958: {'lr': 0.0004997843221607607, 'samples': 759936, 'steps': 3957, 'loss/train': 2.0419363975524902} +11/06/2021 21:49:04 - INFO - __main__ - Step 3959: {'lr': 0.0004997841017193841, 'samples': 760128, 'steps': 3958, 'loss/train': 2.1688108444213867} +11/06/2021 21:49:05 - INFO - __main__ - Step 3960: {'lr': 0.0004997838811654584, 'samples': 760320, 'steps': 3959, 'loss/train': 2.6631009578704834} +11/06/2021 21:49:05 - INFO - __main__ - Step 3961: {'lr': 0.000499783660498984, 'samples': 760512, 'steps': 3960, 'loss/train': 2.2320704460144043} +11/06/2021 21:49:06 - INFO - __main__ - Step 3962: {'lr': 0.0004997834397199609, 'samples': 760704, 'steps': 3961, 'loss/train': 2.1878163814544678} +11/06/2021 21:49:06 - INFO - __main__ - Step 3963: {'lr': 0.0004997832188283893, 'samples': 760896, 'steps': 3962, 'loss/train': 2.8972058296203613} +11/06/2021 21:49:07 - INFO - __main__ - Step 3964: {'lr': 0.0004997829978242693, 'samples': 761088, 'steps': 3963, 'loss/train': 1.9565014839172363} +11/06/2021 21:49:07 - INFO - __main__ - Step 3965: {'lr': 0.0004997827767076008, 'samples': 761280, 'steps': 3964, 'loss/train': 1.7469931840896606} +11/06/2021 21:49:07 - INFO - __main__ - Step 3966: {'lr': 0.0004997825554783841, 'samples': 761472, 'steps': 3965, 'loss/train': 1.9404348134994507} +11/06/2021 21:49:09 - INFO - __main__ - Step 3967: {'lr': 0.0004997823341366192, 'samples': 761664, 'steps': 3966, 'loss/train': 2.1852457523345947} +11/06/2021 21:49:09 - INFO - __main__ - Step 3968: {'lr': 0.0004997821126823062, 'samples': 761856, 'steps': 3967, 'loss/train': 2.048008680343628} +11/06/2021 21:49:09 - INFO - __main__ - Step 3969: {'lr': 0.0004997818911154454, 'samples': 762048, 'steps': 3968, 'loss/train': 2.4784631729125977} +11/06/2021 21:49:10 - INFO - __main__ - Step 3970: {'lr': 0.0004997816694360367, 'samples': 762240, 'steps': 3969, 'loss/train': 2.501253128051758} +11/06/2021 21:49:10 - INFO - __main__ - Step 3971: {'lr': 0.00049978144764408, 'samples': 762432, 'steps': 3970, 'loss/train': 2.0882301330566406} +11/06/2021 21:49:10 - INFO - __main__ - Step 3972: {'lr': 0.0004997812257395758, 'samples': 762624, 'steps': 3971, 'loss/train': 0.8743030428886414} +11/06/2021 21:49:11 - INFO - __main__ - Step 3973: {'lr': 0.0004997810037225241, 'samples': 762816, 'steps': 3972, 'loss/train': 1.5809043645858765} +11/06/2021 21:49:12 - INFO - __main__ - Step 3974: {'lr': 0.0004997807815929248, 'samples': 763008, 'steps': 3973, 'loss/train': 2.1613574028015137} +11/06/2021 21:49:12 - INFO - __main__ - Step 3975: {'lr': 0.0004997805593507783, 'samples': 763200, 'steps': 3974, 'loss/train': 1.512646198272705} +11/06/2021 21:49:12 - INFO - __main__ - Step 3976: {'lr': 0.0004997803369960844, 'samples': 763392, 'steps': 3975, 'loss/train': 1.4740993976593018} +11/06/2021 21:49:13 - INFO - __main__ - Step 3977: {'lr': 0.0004997801145288433, 'samples': 763584, 'steps': 3976, 'loss/train': 1.5394988059997559} +11/06/2021 21:49:14 - INFO - __main__ - Step 3978: {'lr': 0.0004997798919490553, 'samples': 763776, 'steps': 3977, 'loss/train': 1.7356780767440796} +11/06/2021 21:49:14 - INFO - __main__ - Step 3979: {'lr': 0.0004997796692567202, 'samples': 763968, 'steps': 3978, 'loss/train': 2.2947258949279785} +11/06/2021 21:49:14 - INFO - __main__ - Step 3980: {'lr': 0.0004997794464518383, 'samples': 764160, 'steps': 3979, 'loss/train': 2.025333881378174} +11/06/2021 21:49:15 - INFO - __main__ - Step 3981: {'lr': 0.0004997792235344096, 'samples': 764352, 'steps': 3980, 'loss/train': 2.1326520442962646} +11/06/2021 21:49:15 - INFO - __main__ - Step 3982: {'lr': 0.0004997790005044343, 'samples': 764544, 'steps': 3981, 'loss/train': 1.8855067491531372} +11/06/2021 21:49:16 - INFO - __main__ - Step 3983: {'lr': 0.0004997787773619123, 'samples': 764736, 'steps': 3982, 'loss/train': 2.2183456420898438} +11/06/2021 21:49:17 - INFO - __main__ - Step 3984: {'lr': 0.0004997785541068439, 'samples': 764928, 'steps': 3983, 'loss/train': 2.175524950027466} +11/06/2021 21:49:17 - INFO - __main__ - Step 3985: {'lr': 0.0004997783307392292, 'samples': 765120, 'steps': 3984, 'loss/train': 1.8312244415283203} +11/06/2021 21:49:17 - INFO - __main__ - Step 3986: {'lr': 0.0004997781072590683, 'samples': 765312, 'steps': 3985, 'loss/train': 5.831401348114014} +11/06/2021 21:49:18 - INFO - __main__ - Step 3987: {'lr': 0.000499777883666361, 'samples': 765504, 'steps': 3986, 'loss/train': 2.1856584548950195} +11/06/2021 21:49:19 - INFO - __main__ - Step 3988: {'lr': 0.0004997776599611078, 'samples': 765696, 'steps': 3987, 'loss/train': 1.9828382730484009} +11/06/2021 21:49:19 - INFO - __main__ - Step 3989: {'lr': 0.0004997774361433086, 'samples': 765888, 'steps': 3988, 'loss/train': 2.3569905757904053} +11/06/2021 21:49:19 - INFO - __main__ - Step 3990: {'lr': 0.0004997772122129635, 'samples': 766080, 'steps': 3989, 'loss/train': 1.4840973615646362} +11/06/2021 21:49:20 - INFO - __main__ - Step 3991: {'lr': 0.0004997769881700727, 'samples': 766272, 'steps': 3990, 'loss/train': 2.4721338748931885} +11/06/2021 21:49:20 - INFO - __main__ - Step 3992: {'lr': 0.0004997767640146363, 'samples': 766464, 'steps': 3991, 'loss/train': 1.890811800956726} +11/06/2021 21:49:21 - INFO - __main__ - Step 3993: {'lr': 0.0004997765397466543, 'samples': 766656, 'steps': 3992, 'loss/train': 1.7789920568466187} +11/06/2021 21:49:22 - INFO - __main__ - Step 3994: {'lr': 0.0004997763153661269, 'samples': 766848, 'steps': 3993, 'loss/train': 0.7541496157646179} +11/06/2021 21:49:22 - INFO - __main__ - Step 3995: {'lr': 0.000499776090873054, 'samples': 767040, 'steps': 3994, 'loss/train': 1.7700446844100952} +11/06/2021 21:49:22 - INFO - __main__ - Step 3996: {'lr': 0.000499775866267436, 'samples': 767232, 'steps': 3995, 'loss/train': 2.0774638652801514} +11/06/2021 21:49:23 - INFO - __main__ - Step 3997: {'lr': 0.0004997756415492727, 'samples': 767424, 'steps': 3996, 'loss/train': 2.1475741863250732} +11/06/2021 21:49:23 - INFO - __main__ - Step 3998: {'lr': 0.0004997754167185644, 'samples': 767616, 'steps': 3997, 'loss/train': 2.2139883041381836} +11/06/2021 21:49:24 - INFO - __main__ - Step 3999: {'lr': 0.0004997751917753113, 'samples': 767808, 'steps': 3998, 'loss/train': 1.3149014711380005} +11/06/2021 21:49:24 - INFO - __main__ - Step 4000: {'lr': 0.0004997749667195132, 'samples': 768000, 'steps': 3999, 'loss/train': 2.0716893672943115} +11/06/2021 21:49:25 - INFO - __main__ - Step 4001: {'lr': 0.0004997747415511704, 'samples': 768192, 'steps': 4000, 'loss/train': 2.3865301609039307} +11/06/2021 21:49:25 - INFO - __main__ - Step 4002: {'lr': 0.000499774516270283, 'samples': 768384, 'steps': 4001, 'loss/train': 2.4549617767333984} +11/06/2021 21:49:25 - INFO - __main__ - Step 4003: {'lr': 0.0004997742908768508, 'samples': 768576, 'steps': 4002, 'loss/train': 2.512511968612671} +11/06/2021 21:49:27 - INFO - __main__ - Step 4004: {'lr': 0.0004997740653708744, 'samples': 768768, 'steps': 4003, 'loss/train': 1.9932130575180054} +11/06/2021 21:49:27 - INFO - __main__ - Step 4005: {'lr': 0.0004997738397523537, 'samples': 768960, 'steps': 4004, 'loss/train': 2.0718185901641846} +11/06/2021 21:49:27 - INFO - __main__ - Step 4006: {'lr': 0.0004997736140212887, 'samples': 769152, 'steps': 4005, 'loss/train': 2.311023712158203} +11/06/2021 21:49:28 - INFO - __main__ - Step 4007: {'lr': 0.0004997733881776796, 'samples': 769344, 'steps': 4006, 'loss/train': 2.1917130947113037} +11/06/2021 21:49:28 - INFO - __main__ - Step 4008: {'lr': 0.0004997731622215264, 'samples': 769536, 'steps': 4007, 'loss/train': 2.4064438343048096} +11/06/2021 21:49:29 - INFO - __main__ - Step 4009: {'lr': 0.0004997729361528292, 'samples': 769728, 'steps': 4008, 'loss/train': 2.3731486797332764} +11/06/2021 21:49:29 - INFO - __main__ - Step 4010: {'lr': 0.0004997727099715882, 'samples': 769920, 'steps': 4009, 'loss/train': 1.5370467901229858} +11/06/2021 21:49:30 - INFO - __main__ - Step 4011: {'lr': 0.0004997724836778036, 'samples': 770112, 'steps': 4010, 'loss/train': 1.7078628540039062} +11/06/2021 21:49:30 - INFO - __main__ - Step 4012: {'lr': 0.0004997722572714753, 'samples': 770304, 'steps': 4011, 'loss/train': 1.5252915620803833} +11/06/2021 21:49:30 - INFO - __main__ - Step 4013: {'lr': 0.0004997720307526034, 'samples': 770496, 'steps': 4012, 'loss/train': 2.1763927936553955} +11/06/2021 21:49:31 - INFO - __main__ - Step 4014: {'lr': 0.0004997718041211881, 'samples': 770688, 'steps': 4013, 'loss/train': 2.195366382598877} +11/06/2021 21:49:32 - INFO - __main__ - Step 4015: {'lr': 0.0004997715773772296, 'samples': 770880, 'steps': 4014, 'loss/train': 1.1582077741622925} +11/06/2021 21:49:32 - INFO - __main__ - Step 4016: {'lr': 0.0004997713505207278, 'samples': 771072, 'steps': 4015, 'loss/train': 1.8005876541137695} +11/06/2021 21:49:32 - INFO - __main__ - Step 4017: {'lr': 0.0004997711235516829, 'samples': 771264, 'steps': 4016, 'loss/train': 1.86122727394104} +11/06/2021 21:49:33 - INFO - __main__ - Step 4018: {'lr': 0.000499770896470095, 'samples': 771456, 'steps': 4017, 'loss/train': 1.915101170539856} +11/06/2021 21:49:34 - INFO - __main__ - Step 4019: {'lr': 0.0004997706692759642, 'samples': 771648, 'steps': 4018, 'loss/train': 2.1200358867645264} +11/06/2021 21:49:34 - INFO - __main__ - Step 4020: {'lr': 0.0004997704419692905, 'samples': 771840, 'steps': 4019, 'loss/train': 2.1703789234161377} +11/06/2021 21:49:34 - INFO - __main__ - Step 4021: {'lr': 0.0004997702145500741, 'samples': 772032, 'steps': 4020, 'loss/train': 2.4524030685424805} +11/06/2021 21:49:35 - INFO - __main__ - Step 4022: {'lr': 0.0004997699870183151, 'samples': 772224, 'steps': 4021, 'loss/train': 2.2087340354919434} +11/06/2021 21:49:35 - INFO - __main__ - Step 4023: {'lr': 0.0004997697593740137, 'samples': 772416, 'steps': 4022, 'loss/train': 1.8903212547302246} +11/06/2021 21:49:36 - INFO - __main__ - Step 4024: {'lr': 0.0004997695316171698, 'samples': 772608, 'steps': 4023, 'loss/train': 2.31099534034729} +11/06/2021 21:49:37 - INFO - __main__ - Step 4025: {'lr': 0.0004997693037477837, 'samples': 772800, 'steps': 4024, 'loss/train': 2.07493257522583} +11/06/2021 21:49:37 - INFO - __main__ - Step 4026: {'lr': 0.0004997690757658552, 'samples': 772992, 'steps': 4025, 'loss/train': 1.9826215505599976} +11/06/2021 21:49:37 - INFO - __main__ - Step 4027: {'lr': 0.0004997688476713848, 'samples': 773184, 'steps': 4026, 'loss/train': 2.102391004562378} +11/06/2021 21:49:38 - INFO - __main__ - Step 4028: {'lr': 0.0004997686194643724, 'samples': 773376, 'steps': 4027, 'loss/train': 1.9948838949203491} +11/06/2021 21:49:38 - INFO - __main__ - Step 4029: {'lr': 0.0004997683911448181, 'samples': 773568, 'steps': 4028, 'loss/train': 1.7805095911026} +11/06/2021 21:49:39 - INFO - __main__ - Step 4030: {'lr': 0.000499768162712722, 'samples': 773760, 'steps': 4029, 'loss/train': 2.1849615573883057} +11/06/2021 21:49:39 - INFO - __main__ - Step 4031: {'lr': 0.0004997679341680843, 'samples': 773952, 'steps': 4030, 'loss/train': 2.313040256500244} +11/06/2021 21:49:40 - INFO - __main__ - Step 4032: {'lr': 0.0004997677055109049, 'samples': 774144, 'steps': 4031, 'loss/train': 1.893852949142456} +11/06/2021 21:49:40 - INFO - __main__ - Step 4033: {'lr': 0.0004997674767411841, 'samples': 774336, 'steps': 4032, 'loss/train': 2.130466938018799} +11/06/2021 21:49:40 - INFO - __main__ - Step 4034: {'lr': 0.0004997672478589219, 'samples': 774528, 'steps': 4033, 'loss/train': 1.615881085395813} +11/06/2021 21:49:41 - INFO - __main__ - Step 4035: {'lr': 0.0004997670188641183, 'samples': 774720, 'steps': 4034, 'loss/train': 2.1269845962524414} +11/06/2021 21:49:42 - INFO - __main__ - Step 4036: {'lr': 0.0004997667897567738, 'samples': 774912, 'steps': 4035, 'loss/train': 2.2043027877807617} +11/06/2021 21:49:42 - INFO - __main__ - Step 4037: {'lr': 0.0004997665605368881, 'samples': 775104, 'steps': 4036, 'loss/train': 1.7043681144714355} +11/06/2021 21:49:42 - INFO - __main__ - Step 4038: {'lr': 0.0004997663312044614, 'samples': 775296, 'steps': 4037, 'loss/train': 1.8073010444641113} +11/06/2021 21:49:43 - INFO - __main__ - Step 4039: {'lr': 0.0004997661017594939, 'samples': 775488, 'steps': 4038, 'loss/train': 2.2743730545043945} +11/06/2021 21:49:44 - INFO - __main__ - Step 4040: {'lr': 0.0004997658722019857, 'samples': 775680, 'steps': 4039, 'loss/train': 1.5168383121490479} +11/06/2021 21:49:44 - INFO - __main__ - Step 4041: {'lr': 0.0004997656425319367, 'samples': 775872, 'steps': 4040, 'loss/train': 2.3586344718933105} +11/06/2021 21:49:44 - INFO - __main__ - Step 4042: {'lr': 0.0004997654127493473, 'samples': 776064, 'steps': 4041, 'loss/train': 2.290358066558838} +11/06/2021 21:49:45 - INFO - __main__ - Step 4043: {'lr': 0.0004997651828542173, 'samples': 776256, 'steps': 4042, 'loss/train': 2.349440336227417} +11/06/2021 21:49:45 - INFO - __main__ - Step 4044: {'lr': 0.0004997649528465471, 'samples': 776448, 'steps': 4043, 'loss/train': 2.3541646003723145} +11/06/2021 21:49:46 - INFO - __main__ - Step 4045: {'lr': 0.0004997647227263367, 'samples': 776640, 'steps': 4044, 'loss/train': 2.01802396774292} +11/06/2021 21:49:47 - INFO - __main__ - Step 4046: {'lr': 0.000499764492493586, 'samples': 776832, 'steps': 4045, 'loss/train': 1.9747871160507202} +11/06/2021 21:49:47 - INFO - __main__ - Step 4047: {'lr': 0.0004997642621482955, 'samples': 777024, 'steps': 4046, 'loss/train': 3.536803960800171} +11/06/2021 21:49:47 - INFO - __main__ - Step 4048: {'lr': 0.0004997640316904649, 'samples': 777216, 'steps': 4047, 'loss/train': 2.313307523727417} +11/06/2021 21:49:48 - INFO - __main__ - Step 4049: {'lr': 0.0004997638011200946, 'samples': 777408, 'steps': 4048, 'loss/train': 1.8340681791305542} +11/06/2021 21:49:49 - INFO - __main__ - Step 4050: {'lr': 0.0004997635704371844, 'samples': 777600, 'steps': 4049, 'loss/train': 2.015902519226074} +11/06/2021 21:49:49 - INFO - __main__ - Step 4051: {'lr': 0.0004997633396417348, 'samples': 777792, 'steps': 4050, 'loss/train': 2.1511425971984863} +11/06/2021 21:49:49 - INFO - __main__ - Step 4052: {'lr': 0.0004997631087337456, 'samples': 777984, 'steps': 4051, 'loss/train': 1.9303054809570312} +11/06/2021 21:49:50 - INFO - __main__ - Step 4053: {'lr': 0.000499762877713217, 'samples': 778176, 'steps': 4052, 'loss/train': 2.202286720275879} +11/06/2021 21:49:50 - INFO - __main__ - Step 4054: {'lr': 0.0004997626465801492, 'samples': 778368, 'steps': 4053, 'loss/train': 2.0874695777893066} +11/06/2021 21:49:51 - INFO - __main__ - Step 4055: {'lr': 0.000499762415334542, 'samples': 778560, 'steps': 4054, 'loss/train': 1.871009111404419} +11/06/2021 21:49:51 - INFO - __main__ - Step 4056: {'lr': 0.0004997621839763958, 'samples': 778752, 'steps': 4055, 'loss/train': 1.8566710948944092} +11/06/2021 21:49:52 - INFO - __main__ - Step 4057: {'lr': 0.0004997619525057106, 'samples': 778944, 'steps': 4056, 'loss/train': 1.2701704502105713} +11/06/2021 21:49:52 - INFO - __main__ - Step 4058: {'lr': 0.0004997617209224866, 'samples': 779136, 'steps': 4057, 'loss/train': 2.2687175273895264} +11/06/2021 21:49:52 - INFO - __main__ - Step 4059: {'lr': 0.0004997614892267238, 'samples': 779328, 'steps': 4058, 'loss/train': 1.7731740474700928} +11/06/2021 21:49:53 - INFO - __main__ - Step 4060: {'lr': 0.0004997612574184223, 'samples': 779520, 'steps': 4059, 'loss/train': 2.616718292236328} +11/06/2021 21:49:54 - INFO - __main__ - Step 4061: {'lr': 0.0004997610254975823, 'samples': 779712, 'steps': 4060, 'loss/train': 1.441390872001648} +11/06/2021 21:49:54 - INFO - __main__ - Step 4062: {'lr': 0.0004997607934642038, 'samples': 779904, 'steps': 4061, 'loss/train': 2.379161834716797} +11/06/2021 21:49:55 - INFO - __main__ - Step 4063: {'lr': 0.0004997605613182868, 'samples': 780096, 'steps': 4062, 'loss/train': 2.2010395526885986} +11/06/2021 21:49:55 - INFO - __main__ - Step 4064: {'lr': 0.0004997603290598317, 'samples': 780288, 'steps': 4063, 'loss/train': 1.8180835247039795} +11/06/2021 21:49:55 - INFO - __main__ - Step 4065: {'lr': 0.0004997600966888384, 'samples': 780480, 'steps': 4064, 'loss/train': 1.5754492282867432} +11/06/2021 21:49:56 - INFO - __main__ - Step 4066: {'lr': 0.000499759864205307, 'samples': 780672, 'steps': 4065, 'loss/train': 1.9471435546875} +11/06/2021 21:49:57 - INFO - __main__ - Step 4067: {'lr': 0.0004997596316092378, 'samples': 780864, 'steps': 4066, 'loss/train': 0.3540392220020294} +11/06/2021 21:49:57 - INFO - __main__ - Step 4068: {'lr': 0.0004997593989006306, 'samples': 781056, 'steps': 4067, 'loss/train': 1.7563910484313965} +11/06/2021 21:49:58 - INFO - __main__ - Step 4069: {'lr': 0.0004997591660794858, 'samples': 781248, 'steps': 4068, 'loss/train': 2.3376967906951904} +11/06/2021 21:49:58 - INFO - __main__ - Step 4070: {'lr': 0.0004997589331458034, 'samples': 781440, 'steps': 4069, 'loss/train': 2.6819803714752197} +11/06/2021 21:49:59 - INFO - __main__ - Step 4071: {'lr': 0.0004997587000995833, 'samples': 781632, 'steps': 4070, 'loss/train': 2.0289735794067383} +11/06/2021 21:49:59 - INFO - __main__ - Step 4072: {'lr': 0.000499758466940826, 'samples': 781824, 'steps': 4071, 'loss/train': 1.8696802854537964} +11/06/2021 21:50:00 - INFO - __main__ - Step 4073: {'lr': 0.0004997582336695312, 'samples': 782016, 'steps': 4072, 'loss/train': 2.1343019008636475} +11/06/2021 21:50:00 - INFO - __main__ - Step 4074: {'lr': 0.0004997580002856993, 'samples': 782208, 'steps': 4073, 'loss/train': 2.6347973346710205} +11/06/2021 21:50:00 - INFO - __main__ - Step 4075: {'lr': 0.0004997577667893303, 'samples': 782400, 'steps': 4074, 'loss/train': 2.238234519958496} +11/06/2021 21:50:01 - INFO - __main__ - Step 4076: {'lr': 0.0004997575331804243, 'samples': 782592, 'steps': 4075, 'loss/train': 1.6434662342071533} +11/06/2021 21:50:02 - INFO - __main__ - Step 4077: {'lr': 0.0004997572994589812, 'samples': 782784, 'steps': 4076, 'loss/train': 2.2874550819396973} +11/06/2021 21:50:02 - INFO - __main__ - Step 4078: {'lr': 0.0004997570656250016, 'samples': 782976, 'steps': 4077, 'loss/train': 2.18599009513855} +11/06/2021 21:50:02 - INFO - __main__ - Step 4079: {'lr': 0.0004997568316784852, 'samples': 783168, 'steps': 4078, 'loss/train': 2.6030142307281494} +11/06/2021 21:50:03 - INFO - __main__ - Step 4080: {'lr': 0.0004997565976194323, 'samples': 783360, 'steps': 4079, 'loss/train': 2.873201608657837} +11/06/2021 21:50:03 - INFO - __main__ - Step 4081: {'lr': 0.0004997563634478429, 'samples': 783552, 'steps': 4080, 'loss/train': 1.6083195209503174} +11/06/2021 21:50:04 - INFO - __main__ - Step 4082: {'lr': 0.000499756129163717, 'samples': 783744, 'steps': 4081, 'loss/train': 2.6470818519592285} +11/06/2021 21:50:05 - INFO - __main__ - Step 4083: {'lr': 0.000499755894767055, 'samples': 783936, 'steps': 4082, 'loss/train': 2.0863211154937744} +11/06/2021 21:50:05 - INFO - __main__ - Step 4084: {'lr': 0.0004997556602578568, 'samples': 784128, 'steps': 4083, 'loss/train': 2.274592161178589} +11/06/2021 21:50:05 - INFO - __main__ - Step 4085: {'lr': 0.0004997554256361225, 'samples': 784320, 'steps': 4084, 'loss/train': 1.7604327201843262} +11/06/2021 21:50:06 - INFO - __main__ - Step 4086: {'lr': 0.0004997551909018524, 'samples': 784512, 'steps': 4085, 'loss/train': 1.6476736068725586} +11/06/2021 21:50:07 - INFO - __main__ - Step 4087: {'lr': 0.0004997549560550464, 'samples': 784704, 'steps': 4086, 'loss/train': 2.3296737670898438} +11/06/2021 21:50:07 - INFO - __main__ - Step 4088: {'lr': 0.0004997547210957047, 'samples': 784896, 'steps': 4087, 'loss/train': 1.9330281019210815} +11/06/2021 21:50:07 - INFO - __main__ - Step 4089: {'lr': 0.0004997544860238272, 'samples': 785088, 'steps': 4088, 'loss/train': 2.002901315689087} +11/06/2021 21:50:08 - INFO - __main__ - Step 4090: {'lr': 0.0004997542508394144, 'samples': 785280, 'steps': 4089, 'loss/train': 2.227198362350464} +11/06/2021 21:50:08 - INFO - __main__ - Step 4091: {'lr': 0.000499754015542466, 'samples': 785472, 'steps': 4090, 'loss/train': 2.175802707672119} +11/06/2021 21:50:09 - INFO - __main__ - Step 4092: {'lr': 0.0004997537801329824, 'samples': 785664, 'steps': 4091, 'loss/train': 1.697835087776184} +11/06/2021 21:50:10 - INFO - __main__ - Step 4093: {'lr': 0.0004997535446109637, 'samples': 785856, 'steps': 4092, 'loss/train': 1.8053069114685059} +11/06/2021 21:50:10 - INFO - __main__ - Step 4094: {'lr': 0.0004997533089764097, 'samples': 786048, 'steps': 4093, 'loss/train': 1.4036602973937988} +11/06/2021 21:50:10 - INFO - __main__ - Step 4095: {'lr': 0.0004997530732293209, 'samples': 786240, 'steps': 4094, 'loss/train': 1.8951164484024048} +11/06/2021 21:50:11 - INFO - __main__ - Step 4096: {'lr': 0.000499752837369697, 'samples': 786432, 'steps': 4095, 'loss/train': 2.195209264755249} +11/06/2021 21:50:12 - INFO - __main__ - Step 4097: {'lr': 0.0004997526013975385, 'samples': 786624, 'steps': 4096, 'loss/train': 1.7116293907165527} +11/06/2021 21:50:12 - INFO - __main__ - Step 4098: {'lr': 0.0004997523653128453, 'samples': 786816, 'steps': 4097, 'loss/train': 1.4756605625152588} +11/06/2021 21:50:12 - INFO - __main__ - Step 4099: {'lr': 0.0004997521291156175, 'samples': 787008, 'steps': 4098, 'loss/train': 2.56708025932312} +11/06/2021 21:50:13 - INFO - __main__ - Step 4100: {'lr': 0.0004997518928058553, 'samples': 787200, 'steps': 4099, 'loss/train': 1.9039506912231445} +11/06/2021 21:50:13 - INFO - __main__ - Step 4101: {'lr': 0.0004997516563835587, 'samples': 787392, 'steps': 4100, 'loss/train': 2.242305040359497} +11/06/2021 21:50:14 - INFO - __main__ - Step 4102: {'lr': 0.0004997514198487279, 'samples': 787584, 'steps': 4101, 'loss/train': 1.7869306802749634} +11/06/2021 21:50:15 - INFO - __main__ - Step 4103: {'lr': 0.0004997511832013629, 'samples': 787776, 'steps': 4102, 'loss/train': 1.4681452512741089} +11/06/2021 21:50:15 - INFO - __main__ - Step 4104: {'lr': 0.0004997509464414639, 'samples': 787968, 'steps': 4103, 'loss/train': 1.8288829326629639} +11/06/2021 21:50:15 - INFO - __main__ - Step 4105: {'lr': 0.000499750709569031, 'samples': 788160, 'steps': 4104, 'loss/train': 2.145322322845459} +11/06/2021 21:50:16 - INFO - __main__ - Step 4106: {'lr': 0.0004997504725840644, 'samples': 788352, 'steps': 4105, 'loss/train': 1.8525432348251343} +11/06/2021 21:50:17 - INFO - __main__ - Step 4107: {'lr': 0.0004997502354865639, 'samples': 788544, 'steps': 4106, 'loss/train': 2.4128339290618896} +11/06/2021 21:50:17 - INFO - __main__ - Step 4108: {'lr': 0.0004997499982765299, 'samples': 788736, 'steps': 4107, 'loss/train': 2.3028995990753174} +11/06/2021 21:50:17 - INFO - __main__ - Step 4109: {'lr': 0.0004997497609539623, 'samples': 788928, 'steps': 4108, 'loss/train': 1.7529590129852295} +11/06/2021 21:50:18 - INFO - __main__ - Step 4110: {'lr': 0.0004997495235188614, 'samples': 789120, 'steps': 4109, 'loss/train': 2.2879607677459717} +11/06/2021 21:50:18 - INFO - __main__ - Step 4111: {'lr': 0.0004997492859712272, 'samples': 789312, 'steps': 4110, 'loss/train': 2.290275812149048} +11/06/2021 21:50:19 - INFO - __main__ - Step 4112: {'lr': 0.0004997490483110599, 'samples': 789504, 'steps': 4111, 'loss/train': 2.2251839637756348} +11/06/2021 21:50:19 - INFO - __main__ - Step 4113: {'lr': 0.0004997488105383594, 'samples': 789696, 'steps': 4112, 'loss/train': 1.8223003149032593} +11/06/2021 21:50:20 - INFO - __main__ - Step 4114: {'lr': 0.000499748572653126, 'samples': 789888, 'steps': 4113, 'loss/train': 2.5275418758392334} +11/06/2021 21:50:20 - INFO - __main__ - Step 4115: {'lr': 0.0004997483346553597, 'samples': 790080, 'steps': 4114, 'loss/train': 2.204193592071533} +11/06/2021 21:50:21 - INFO - __main__ - Step 4116: {'lr': 0.0004997480965450607, 'samples': 790272, 'steps': 4115, 'loss/train': 2.2369582653045654} +11/06/2021 21:50:21 - INFO - __main__ - Step 4117: {'lr': 0.0004997478583222291, 'samples': 790464, 'steps': 4116, 'loss/train': 1.5711380243301392} +11/06/2021 21:50:22 - INFO - __main__ - Step 4118: {'lr': 0.0004997476199868649, 'samples': 790656, 'steps': 4117, 'loss/train': 2.431384563446045} +11/06/2021 21:50:22 - INFO - __main__ - Step 4119: {'lr': 0.0004997473815389683, 'samples': 790848, 'steps': 4118, 'loss/train': 2.284108877182007} +11/06/2021 21:50:23 - INFO - __main__ - Step 4120: {'lr': 0.0004997471429785394, 'samples': 791040, 'steps': 4119, 'loss/train': 2.340329170227051} +11/06/2021 21:50:23 - INFO - __main__ - Step 4121: {'lr': 0.0004997469043055784, 'samples': 791232, 'steps': 4120, 'loss/train': 1.350162386894226} +11/06/2021 21:50:24 - INFO - __main__ - Step 4122: {'lr': 0.000499746665520085, 'samples': 791424, 'steps': 4121, 'loss/train': 2.2945504188537598} +11/06/2021 21:50:24 - INFO - __main__ - Step 4123: {'lr': 0.0004997464266220599, 'samples': 791616, 'steps': 4122, 'loss/train': 1.9403982162475586} +11/06/2021 21:50:25 - INFO - __main__ - Step 4124: {'lr': 0.0004997461876115029, 'samples': 791808, 'steps': 4123, 'loss/train': 1.7669719457626343} +11/06/2021 21:50:25 - INFO - __main__ - Step 4125: {'lr': 0.0004997459484884139, 'samples': 792000, 'steps': 4124, 'loss/train': 2.5181665420532227} +11/06/2021 21:50:25 - INFO - __main__ - Step 4126: {'lr': 0.0004997457092527934, 'samples': 792192, 'steps': 4125, 'loss/train': 1.4069466590881348} +11/06/2021 21:50:26 - INFO - __main__ - Step 4127: {'lr': 0.0004997454699046412, 'samples': 792384, 'steps': 4126, 'loss/train': 1.1352291107177734} +11/06/2021 21:50:27 - INFO - __main__ - Step 4128: {'lr': 0.0004997452304439577, 'samples': 792576, 'steps': 4127, 'loss/train': 2.2297260761260986} +11/06/2021 21:50:27 - INFO - __main__ - Step 4129: {'lr': 0.0004997449908707428, 'samples': 792768, 'steps': 4128, 'loss/train': 1.6142773628234863} +11/06/2021 21:50:27 - INFO - __main__ - Step 4130: {'lr': 0.0004997447511849966, 'samples': 792960, 'steps': 4129, 'loss/train': 0.43251675367355347} +11/06/2021 21:50:28 - INFO - __main__ - Step 4131: {'lr': 0.0004997445113867193, 'samples': 793152, 'steps': 4130, 'loss/train': 2.1551005840301514} +11/06/2021 21:50:28 - INFO - __main__ - Step 4132: {'lr': 0.000499744271475911, 'samples': 793344, 'steps': 4131, 'loss/train': 1.9457584619522095} +11/06/2021 21:50:29 - INFO - __main__ - Step 4133: {'lr': 0.0004997440314525718, 'samples': 793536, 'steps': 4132, 'loss/train': 1.7447444200515747} +11/06/2021 21:50:29 - INFO - __main__ - Step 4134: {'lr': 0.0004997437913167018, 'samples': 793728, 'steps': 4133, 'loss/train': 2.1197428703308105} +11/06/2021 21:50:30 - INFO - __main__ - Step 4135: {'lr': 0.0004997435510683011, 'samples': 793920, 'steps': 4134, 'loss/train': 1.950053095817566} +11/06/2021 21:50:30 - INFO - __main__ - Step 4136: {'lr': 0.0004997433107073697, 'samples': 794112, 'steps': 4135, 'loss/train': 2.236959457397461} +11/06/2021 21:50:30 - INFO - __main__ - Step 4137: {'lr': 0.000499743070233908, 'samples': 794304, 'steps': 4136, 'loss/train': 2.2369892597198486} +11/06/2021 21:50:31 - INFO - __main__ - Step 4138: {'lr': 0.0004997428296479158, 'samples': 794496, 'steps': 4137, 'loss/train': 1.6959571838378906} +11/06/2021 21:50:32 - INFO - __main__ - Step 4139: {'lr': 0.0004997425889493933, 'samples': 794688, 'steps': 4138, 'loss/train': 2.1793487071990967} +11/06/2021 21:50:32 - INFO - __main__ - Step 4140: {'lr': 0.0004997423481383407, 'samples': 794880, 'steps': 4139, 'loss/train': 1.875229001045227} +11/06/2021 21:50:33 - INFO - __main__ - Step 4141: {'lr': 0.0004997421072147581, 'samples': 795072, 'steps': 4140, 'loss/train': 2.0105512142181396} +11/06/2021 21:50:33 - INFO - __main__ - Step 4142: {'lr': 0.0004997418661786455, 'samples': 795264, 'steps': 4141, 'loss/train': 2.1727404594421387} +11/06/2021 21:50:34 - INFO - __main__ - Step 4143: {'lr': 0.0004997416250300031, 'samples': 795456, 'steps': 4142, 'loss/train': 2.191661834716797} +11/06/2021 21:50:34 - INFO - __main__ - Step 4144: {'lr': 0.0004997413837688309, 'samples': 795648, 'steps': 4143, 'loss/train': 1.4901235103607178} +11/06/2021 21:50:35 - INFO - __main__ - Step 4145: {'lr': 0.0004997411423951292, 'samples': 795840, 'steps': 4144, 'loss/train': 2.327420234680176} +11/06/2021 21:50:35 - INFO - __main__ - Step 4146: {'lr': 0.0004997409009088979, 'samples': 796032, 'steps': 4145, 'loss/train': 2.225456476211548} +11/06/2021 21:50:35 - INFO - __main__ - Step 4147: {'lr': 0.0004997406593101373, 'samples': 796224, 'steps': 4146, 'loss/train': 1.6128720045089722} +11/06/2021 21:50:36 - INFO - __main__ - Step 4148: {'lr': 0.0004997404175988474, 'samples': 796416, 'steps': 4147, 'loss/train': 1.3797961473464966} +11/06/2021 21:50:37 - INFO - __main__ - Step 4149: {'lr': 0.0004997401757750282, 'samples': 796608, 'steps': 4148, 'loss/train': 2.3454394340515137} +11/06/2021 21:50:37 - INFO - __main__ - Step 4150: {'lr': 0.00049973993383868, 'samples': 796800, 'steps': 4149, 'loss/train': 1.4798073768615723} +11/06/2021 21:50:37 - INFO - __main__ - Step 4151: {'lr': 0.0004997396917898029, 'samples': 796992, 'steps': 4150, 'loss/train': 1.8693385124206543} +11/06/2021 21:50:38 - INFO - __main__ - Step 4152: {'lr': 0.0004997394496283969, 'samples': 797184, 'steps': 4151, 'loss/train': 1.895919919013977} +11/06/2021 21:50:39 - INFO - __main__ - Step 4153: {'lr': 0.0004997392073544622, 'samples': 797376, 'steps': 4152, 'loss/train': 2.0135254859924316} +11/06/2021 21:50:39 - INFO - __main__ - Step 4154: {'lr': 0.0004997389649679987, 'samples': 797568, 'steps': 4153, 'loss/train': 1.9823795557022095} +11/06/2021 21:50:39 - INFO - __main__ - Step 4155: {'lr': 0.0004997387224690068, 'samples': 797760, 'steps': 4154, 'loss/train': 2.079752206802368} +11/06/2021 21:50:40 - INFO - __main__ - Step 4156: {'lr': 0.0004997384798574865, 'samples': 797952, 'steps': 4155, 'loss/train': 1.7831960916519165} +11/06/2021 21:50:40 - INFO - __main__ - Step 4157: {'lr': 0.0004997382371334379, 'samples': 798144, 'steps': 4156, 'loss/train': 1.613570213317871} +11/06/2021 21:50:41 - INFO - __main__ - Step 4158: {'lr': 0.0004997379942968611, 'samples': 798336, 'steps': 4157, 'loss/train': 2.2602744102478027} +11/06/2021 21:50:41 - INFO - __main__ - Step 4159: {'lr': 0.0004997377513477562, 'samples': 798528, 'steps': 4158, 'loss/train': 1.372780203819275} +11/06/2021 21:50:42 - INFO - __main__ - Step 4160: {'lr': 0.0004997375082861234, 'samples': 798720, 'steps': 4159, 'loss/train': 0.5014187693595886} +11/06/2021 21:50:42 - INFO - __main__ - Step 4161: {'lr': 0.0004997372651119626, 'samples': 798912, 'steps': 4160, 'loss/train': 2.1681416034698486} +11/06/2021 21:50:42 - INFO - __main__ - Step 4162: {'lr': 0.0004997370218252741, 'samples': 799104, 'steps': 4161, 'loss/train': 1.6607433557510376} +11/06/2021 21:50:44 - INFO - __main__ - Step 4163: {'lr': 0.000499736778426058, 'samples': 799296, 'steps': 4162, 'loss/train': 1.9761664867401123} +11/06/2021 21:50:44 - INFO - __main__ - Step 4164: {'lr': 0.0004997365349143142, 'samples': 799488, 'steps': 4163, 'loss/train': 2.0288639068603516} +11/06/2021 21:50:44 - INFO - __main__ - Step 4165: {'lr': 0.0004997362912900432, 'samples': 799680, 'steps': 4164, 'loss/train': 2.2376766204833984} +11/06/2021 21:50:45 - INFO - __main__ - Step 4166: {'lr': 0.0004997360475532447, 'samples': 799872, 'steps': 4165, 'loss/train': 2.014327049255371} +11/06/2021 21:50:45 - INFO - __main__ - Step 4167: {'lr': 0.000499735803703919, 'samples': 800064, 'steps': 4166, 'loss/train': 2.371185302734375} +11/06/2021 21:50:46 - INFO - __main__ - Step 4168: {'lr': 0.0004997355597420663, 'samples': 800256, 'steps': 4167, 'loss/train': 1.7514441013336182} +11/06/2021 21:50:46 - INFO - __main__ - Step 4169: {'lr': 0.0004997353156676866, 'samples': 800448, 'steps': 4168, 'loss/train': 2.4108896255493164} +11/06/2021 21:50:47 - INFO - __main__ - Step 4170: {'lr': 0.0004997350714807799, 'samples': 800640, 'steps': 4169, 'loss/train': 1.9724844694137573} +11/06/2021 21:50:47 - INFO - __main__ - Step 4171: {'lr': 0.0004997348271813466, 'samples': 800832, 'steps': 4170, 'loss/train': 2.2488949298858643} +11/06/2021 21:50:47 - INFO - __main__ - Step 4172: {'lr': 0.0004997345827693865, 'samples': 801024, 'steps': 4171, 'loss/train': 2.0820884704589844} +11/06/2021 21:50:48 - INFO - __main__ - Step 4173: {'lr': 0.0004997343382448999, 'samples': 801216, 'steps': 4172, 'loss/train': 1.9005787372589111} +11/06/2021 21:50:49 - INFO - __main__ - Step 4174: {'lr': 0.0004997340936078869, 'samples': 801408, 'steps': 4173, 'loss/train': 2.1329050064086914} +11/06/2021 21:50:49 - INFO - __main__ - Step 4175: {'lr': 0.0004997338488583475, 'samples': 801600, 'steps': 4174, 'loss/train': 2.015869617462158} +11/06/2021 21:50:50 - INFO - __main__ - Step 4176: {'lr': 0.000499733603996282, 'samples': 801792, 'steps': 4175, 'loss/train': 1.6287065744400024} +11/06/2021 21:50:50 - INFO - __main__ - Step 4177: {'lr': 0.0004997333590216902, 'samples': 801984, 'steps': 4176, 'loss/train': 2.286756753921509} +11/06/2021 21:50:50 - INFO - __main__ - Step 4178: {'lr': 0.0004997331139345725, 'samples': 802176, 'steps': 4177, 'loss/train': 2.0928821563720703} +11/06/2021 21:50:51 - INFO - __main__ - Step 4179: {'lr': 0.000499732868734929, 'samples': 802368, 'steps': 4178, 'loss/train': 1.4197605848312378} +11/06/2021 21:50:52 - INFO - __main__ - Step 4180: {'lr': 0.0004997326234227596, 'samples': 802560, 'steps': 4179, 'loss/train': 1.9068725109100342} +11/06/2021 21:50:52 - INFO - __main__ - Step 4181: {'lr': 0.0004997323779980646, 'samples': 802752, 'steps': 4180, 'loss/train': 0.9633380174636841} +11/06/2021 21:50:52 - INFO - __main__ - Step 4182: {'lr': 0.0004997321324608441, 'samples': 802944, 'steps': 4181, 'loss/train': 2.2076642513275146} +11/06/2021 21:50:53 - INFO - __main__ - Step 4183: {'lr': 0.0004997318868110981, 'samples': 803136, 'steps': 4182, 'loss/train': 2.6250104904174805} +11/06/2021 21:50:54 - INFO - __main__ - Step 4184: {'lr': 0.0004997316410488267, 'samples': 803328, 'steps': 4183, 'loss/train': 2.3980045318603516} +11/06/2021 21:50:54 - INFO - __main__ - Step 4185: {'lr': 0.0004997313951740301, 'samples': 803520, 'steps': 4184, 'loss/train': 1.4753458499908447} +11/06/2021 21:50:54 - INFO - __main__ - Step 4186: {'lr': 0.0004997311491867083, 'samples': 803712, 'steps': 4185, 'loss/train': 1.5125452280044556} +11/06/2021 21:50:55 - INFO - __main__ - Step 4187: {'lr': 0.0004997309030868617, 'samples': 803904, 'steps': 4186, 'loss/train': 1.2969268560409546} +11/06/2021 21:50:55 - INFO - __main__ - Step 4188: {'lr': 0.0004997306568744901, 'samples': 804096, 'steps': 4187, 'loss/train': 2.0338566303253174} +11/06/2021 21:50:56 - INFO - __main__ - Step 4189: {'lr': 0.0004997304105495938, 'samples': 804288, 'steps': 4188, 'loss/train': 1.7441582679748535} +11/06/2021 21:50:57 - INFO - __main__ - Step 4190: {'lr': 0.0004997301641121727, 'samples': 804480, 'steps': 4189, 'loss/train': 2.200920581817627} +11/06/2021 21:50:57 - INFO - __main__ - Step 4191: {'lr': 0.0004997299175622271, 'samples': 804672, 'steps': 4190, 'loss/train': 2.2595231533050537} +11/06/2021 21:50:57 - INFO - __main__ - Step 4192: {'lr': 0.000499729670899757, 'samples': 804864, 'steps': 4191, 'loss/train': 2.5529255867004395} +11/06/2021 21:50:58 - INFO - __main__ - Step 4193: {'lr': 0.0004997294241247627, 'samples': 805056, 'steps': 4192, 'loss/train': 1.6093616485595703} +11/06/2021 21:50:59 - INFO - __main__ - Step 4194: {'lr': 0.0004997291772372441, 'samples': 805248, 'steps': 4193, 'loss/train': 1.4874943494796753} +11/06/2021 21:50:59 - INFO - __main__ - Step 4195: {'lr': 0.0004997289302372014, 'samples': 805440, 'steps': 4194, 'loss/train': 2.0579819679260254} +11/06/2021 21:51:00 - INFO - __main__ - Step 4196: {'lr': 0.0004997286831246347, 'samples': 805632, 'steps': 4195, 'loss/train': 2.4122848510742188} +11/06/2021 21:51:00 - INFO - __main__ - Step 4197: {'lr': 0.0004997284358995441, 'samples': 805824, 'steps': 4196, 'loss/train': 2.2387192249298096} +11/06/2021 21:51:00 - INFO - __main__ - Step 4198: {'lr': 0.0004997281885619297, 'samples': 806016, 'steps': 4197, 'loss/train': 1.6527743339538574} +11/06/2021 21:51:01 - INFO - __main__ - Step 4199: {'lr': 0.0004997279411117916, 'samples': 806208, 'steps': 4198, 'loss/train': 0.3961840569972992} +11/06/2021 21:51:02 - INFO - __main__ - Step 4200: {'lr': 0.00049972769354913, 'samples': 806400, 'steps': 4199, 'loss/train': 1.9782782793045044} +11/06/2021 21:51:02 - INFO - __main__ - Step 4201: {'lr': 0.0004997274458739449, 'samples': 806592, 'steps': 4200, 'loss/train': 2.000523328781128} +11/06/2021 21:51:02 - INFO - __main__ - Step 4202: {'lr': 0.0004997271980862366, 'samples': 806784, 'steps': 4201, 'loss/train': 2.5717737674713135} +11/06/2021 21:51:03 - INFO - __main__ - Step 4203: {'lr': 0.000499726950186005, 'samples': 806976, 'steps': 4202, 'loss/train': 2.567746639251709} +11/06/2021 21:51:03 - INFO - __main__ - Step 4204: {'lr': 0.0004997267021732502, 'samples': 807168, 'steps': 4203, 'loss/train': 2.4571382999420166} +11/06/2021 21:51:04 - INFO - __main__ - Step 4205: {'lr': 0.0004997264540479724, 'samples': 807360, 'steps': 4204, 'loss/train': 1.8436121940612793} +11/06/2021 21:51:05 - INFO - __main__ - Step 4206: {'lr': 0.0004997262058101719, 'samples': 807552, 'steps': 4205, 'loss/train': 2.192099094390869} +11/06/2021 21:51:05 - INFO - __main__ - Step 4207: {'lr': 0.0004997259574598485, 'samples': 807744, 'steps': 4206, 'loss/train': 2.6766111850738525} +11/06/2021 21:51:05 - INFO - __main__ - Step 4208: {'lr': 0.0004997257089970024, 'samples': 807936, 'steps': 4207, 'loss/train': 2.0918617248535156} +11/06/2021 21:51:06 - INFO - __main__ - Step 4209: {'lr': 0.0004997254604216338, 'samples': 808128, 'steps': 4208, 'loss/train': 2.2900002002716064} +11/06/2021 21:51:07 - INFO - __main__ - Step 4210: {'lr': 0.0004997252117337428, 'samples': 808320, 'steps': 4209, 'loss/train': 1.7111936807632446} +11/06/2021 21:51:07 - INFO - __main__ - Step 4211: {'lr': 0.0004997249629333294, 'samples': 808512, 'steps': 4210, 'loss/train': 2.1886565685272217} +11/06/2021 21:51:07 - INFO - __main__ - Step 4212: {'lr': 0.0004997247140203939, 'samples': 808704, 'steps': 4211, 'loss/train': 2.0272629261016846} +11/06/2021 21:51:08 - INFO - __main__ - Step 4213: {'lr': 0.0004997244649949362, 'samples': 808896, 'steps': 4212, 'loss/train': 1.792849063873291} +11/06/2021 21:51:08 - INFO - __main__ - Step 4214: {'lr': 0.0004997242158569564, 'samples': 809088, 'steps': 4213, 'loss/train': 1.8342564105987549} +11/06/2021 21:51:09 - INFO - __main__ - Step 4215: {'lr': 0.0004997239666064549, 'samples': 809280, 'steps': 4214, 'loss/train': 2.516932249069214} +11/06/2021 21:51:09 - INFO - __main__ - Step 4216: {'lr': 0.0004997237172434316, 'samples': 809472, 'steps': 4215, 'loss/train': 1.893647313117981} +11/06/2021 21:51:10 - INFO - __main__ - Step 4217: {'lr': 0.0004997234677678867, 'samples': 809664, 'steps': 4216, 'loss/train': 2.4590060710906982} +11/06/2021 21:51:10 - INFO - __main__ - Step 4218: {'lr': 0.0004997232181798201, 'samples': 809856, 'steps': 4217, 'loss/train': 1.6287667751312256} +11/06/2021 21:51:10 - INFO - __main__ - Step 4219: {'lr': 0.0004997229684792322, 'samples': 810048, 'steps': 4218, 'loss/train': 2.320136070251465} +11/06/2021 21:51:12 - INFO - __main__ - Step 4220: {'lr': 0.000499722718666123, 'samples': 810240, 'steps': 4219, 'loss/train': 2.140002965927124} +11/06/2021 21:51:12 - INFO - __main__ - Step 4221: {'lr': 0.0004997224687404926, 'samples': 810432, 'steps': 4220, 'loss/train': 2.0114235877990723} +11/06/2021 21:51:12 - INFO - __main__ - Step 4222: {'lr': 0.0004997222187023409, 'samples': 810624, 'steps': 4221, 'loss/train': 1.9719492197036743} +11/06/2021 21:51:13 - INFO - __main__ - Step 4223: {'lr': 0.0004997219685516684, 'samples': 810816, 'steps': 4222, 'loss/train': 2.0050837993621826} +11/06/2021 21:51:13 - INFO - __main__ - Step 4224: {'lr': 0.000499721718288475, 'samples': 811008, 'steps': 4223, 'loss/train': 1.0554298162460327} +11/06/2021 21:51:14 - INFO - __main__ - Step 4225: {'lr': 0.0004997214679127609, 'samples': 811200, 'steps': 4224, 'loss/train': 2.309093713760376} +11/06/2021 21:51:14 - INFO - __main__ - Step 4226: {'lr': 0.000499721217424526, 'samples': 811392, 'steps': 4225, 'loss/train': 1.7864500284194946} +11/06/2021 21:51:15 - INFO - __main__ - Step 4227: {'lr': 0.0004997209668237707, 'samples': 811584, 'steps': 4226, 'loss/train': 2.3149712085723877} +11/06/2021 21:51:15 - INFO - __main__ - Step 4228: {'lr': 0.0004997207161104951, 'samples': 811776, 'steps': 4227, 'loss/train': 2.2613799571990967} +11/06/2021 21:51:15 - INFO - __main__ - Step 4229: {'lr': 0.0004997204652846991, 'samples': 811968, 'steps': 4228, 'loss/train': 1.9725654125213623} +11/06/2021 21:51:16 - INFO - __main__ - Step 4230: {'lr': 0.0004997202143463828, 'samples': 812160, 'steps': 4229, 'loss/train': 2.0676584243774414} +11/06/2021 21:51:17 - INFO - __main__ - Step 4231: {'lr': 0.0004997199632955464, 'samples': 812352, 'steps': 4230, 'loss/train': 2.0852909088134766} +11/06/2021 21:51:17 - INFO - __main__ - Step 4232: {'lr': 0.0004997197121321903, 'samples': 812544, 'steps': 4231, 'loss/train': 2.0031850337982178} +11/06/2021 21:51:18 - INFO - __main__ - Step 4233: {'lr': 0.0004997194608563142, 'samples': 812736, 'steps': 4232, 'loss/train': 1.9812066555023193} +11/06/2021 21:51:18 - INFO - __main__ - Step 4234: {'lr': 0.0004997192094679183, 'samples': 812928, 'steps': 4233, 'loss/train': 2.6864309310913086} +11/06/2021 21:51:18 - INFO - __main__ - Step 4235: {'lr': 0.0004997189579670028, 'samples': 813120, 'steps': 4234, 'loss/train': 2.032951831817627} +11/06/2021 21:51:19 - INFO - __main__ - Step 4236: {'lr': 0.0004997187063535679, 'samples': 813312, 'steps': 4235, 'loss/train': 2.289562463760376} +11/06/2021 21:51:20 - INFO - __main__ - Step 4237: {'lr': 0.0004997184546276135, 'samples': 813504, 'steps': 4236, 'loss/train': 1.5230915546417236} +11/06/2021 21:51:20 - INFO - __main__ - Step 4238: {'lr': 0.0004997182027891399, 'samples': 813696, 'steps': 4237, 'loss/train': 2.07342529296875} +11/06/2021 21:51:21 - INFO - __main__ - Step 4239: {'lr': 0.000499717950838147, 'samples': 813888, 'steps': 4238, 'loss/train': 1.0521665811538696} +11/06/2021 21:51:21 - INFO - __main__ - Step 4240: {'lr': 0.0004997176987746352, 'samples': 814080, 'steps': 4239, 'loss/train': 2.1802866458892822} +11/06/2021 21:51:21 - INFO - __main__ - Step 4241: {'lr': 0.0004997174465986043, 'samples': 814272, 'steps': 4240, 'loss/train': 1.9899753332138062} +11/06/2021 21:51:23 - INFO - __main__ - Step 4242: {'lr': 0.0004997171943100547, 'samples': 814464, 'steps': 4241, 'loss/train': 1.9145240783691406} +11/06/2021 21:51:23 - INFO - __main__ - Step 4243: {'lr': 0.0004997169419089863, 'samples': 814656, 'steps': 4242, 'loss/train': 2.2730929851531982} +11/06/2021 21:51:23 - INFO - __main__ - Step 4244: {'lr': 0.0004997166893953994, 'samples': 814848, 'steps': 4243, 'loss/train': 2.227478504180908} +11/06/2021 21:51:24 - INFO - __main__ - Step 4245: {'lr': 0.000499716436769294, 'samples': 815040, 'steps': 4244, 'loss/train': 1.7130650281906128} +11/06/2021 21:51:24 - INFO - __main__ - Step 4246: {'lr': 0.0004997161840306701, 'samples': 815232, 'steps': 4245, 'loss/train': 2.1107656955718994} +11/06/2021 21:51:25 - INFO - __main__ - Step 4247: {'lr': 0.0004997159311795281, 'samples': 815424, 'steps': 4246, 'loss/train': 2.0193605422973633} +11/06/2021 21:51:25 - INFO - __main__ - Step 4248: {'lr': 0.0004997156782158679, 'samples': 815616, 'steps': 4247, 'loss/train': 2.169619083404541} +11/06/2021 21:51:26 - INFO - __main__ - Step 4249: {'lr': 0.0004997154251396896, 'samples': 815808, 'steps': 4248, 'loss/train': 1.5952482223510742} +11/06/2021 21:51:26 - INFO - __main__ - Step 4250: {'lr': 0.0004997151719509935, 'samples': 816000, 'steps': 4249, 'loss/train': 2.200782060623169} +11/06/2021 21:51:26 - INFO - __main__ - Step 4251: {'lr': 0.0004997149186497795, 'samples': 816192, 'steps': 4250, 'loss/train': 2.353931188583374} +11/06/2021 21:51:27 - INFO - __main__ - Step 4252: {'lr': 0.0004997146652360478, 'samples': 816384, 'steps': 4251, 'loss/train': 1.8407737016677856} +11/06/2021 21:51:28 - INFO - __main__ - Step 4253: {'lr': 0.0004997144117097986, 'samples': 816576, 'steps': 4252, 'loss/train': 1.8652644157409668} +11/06/2021 21:51:28 - INFO - __main__ - Step 4254: {'lr': 0.0004997141580710318, 'samples': 816768, 'steps': 4253, 'loss/train': 2.0572428703308105} +11/06/2021 21:51:28 - INFO - __main__ - Step 4255: {'lr': 0.0004997139043197478, 'samples': 816960, 'steps': 4254, 'loss/train': 1.7917412519454956} +11/06/2021 21:51:29 - INFO - __main__ - Step 4256: {'lr': 0.0004997136504559465, 'samples': 817152, 'steps': 4255, 'loss/train': 1.9230844974517822} +11/06/2021 21:51:30 - INFO - __main__ - Step 4257: {'lr': 0.0004997133964796281, 'samples': 817344, 'steps': 4256, 'loss/train': 2.0481159687042236} +11/06/2021 21:51:30 - INFO - __main__ - Step 4258: {'lr': 0.0004997131423907927, 'samples': 817536, 'steps': 4257, 'loss/train': 2.003450632095337} +11/06/2021 21:51:31 - INFO - __main__ - Step 4259: {'lr': 0.0004997128881894404, 'samples': 817728, 'steps': 4258, 'loss/train': 2.5174543857574463} +11/06/2021 21:51:31 - INFO - __main__ - Step 4260: {'lr': 0.0004997126338755714, 'samples': 817920, 'steps': 4259, 'loss/train': 2.247880697250366} +11/06/2021 21:51:31 - INFO - __main__ - Step 4261: {'lr': 0.0004997123794491856, 'samples': 818112, 'steps': 4260, 'loss/train': 2.505103349685669} +11/06/2021 21:51:32 - INFO - __main__ - Step 4262: {'lr': 0.0004997121249102834, 'samples': 818304, 'steps': 4261, 'loss/train': 1.9285527467727661} +11/06/2021 21:51:33 - INFO - __main__ - Step 4263: {'lr': 0.0004997118702588647, 'samples': 818496, 'steps': 4262, 'loss/train': 2.225656509399414} +11/06/2021 21:51:33 - INFO - __main__ - Step 4264: {'lr': 0.0004997116154949297, 'samples': 818688, 'steps': 4263, 'loss/train': 1.5641311407089233} +11/06/2021 21:51:34 - INFO - __main__ - Step 4265: {'lr': 0.0004997113606184785, 'samples': 818880, 'steps': 4264, 'loss/train': 1.9400560855865479} +11/06/2021 21:51:34 - INFO - __main__ - Step 4266: {'lr': 0.0004997111056295111, 'samples': 819072, 'steps': 4265, 'loss/train': 2.0672645568847656} +11/06/2021 21:51:35 - INFO - __main__ - Step 4267: {'lr': 0.0004997108505280279, 'samples': 819264, 'steps': 4266, 'loss/train': 2.7679026126861572} +11/06/2021 21:51:35 - INFO - __main__ - Step 4268: {'lr': 0.0004997105953140288, 'samples': 819456, 'steps': 4267, 'loss/train': 1.6954803466796875} +11/06/2021 21:51:36 - INFO - __main__ - Step 4269: {'lr': 0.0004997103399875139, 'samples': 819648, 'steps': 4268, 'loss/train': 1.9309132099151611} +11/06/2021 21:51:36 - INFO - __main__ - Step 4270: {'lr': 0.0004997100845484834, 'samples': 819840, 'steps': 4269, 'loss/train': 1.524571418762207} +11/06/2021 21:51:37 - INFO - __main__ - Step 4271: {'lr': 0.0004997098289969374, 'samples': 820032, 'steps': 4270, 'loss/train': 1.9430183172225952} +11/06/2021 21:51:37 - INFO - __main__ - Step 4272: {'lr': 0.0004997095733328761, 'samples': 820224, 'steps': 4271, 'loss/train': 2.232881784439087} +11/06/2021 21:51:38 - INFO - __main__ - Step 4273: {'lr': 0.0004997093175562994, 'samples': 820416, 'steps': 4272, 'loss/train': 2.1205177307128906} +11/06/2021 21:51:38 - INFO - __main__ - Step 4274: {'lr': 0.0004997090616672076, 'samples': 820608, 'steps': 4273, 'loss/train': 2.2687668800354004} +11/06/2021 21:51:39 - INFO - __main__ - Step 4275: {'lr': 0.0004997088056656006, 'samples': 820800, 'steps': 4274, 'loss/train': 2.34332275390625} +11/06/2021 21:51:39 - INFO - __main__ - Step 4276: {'lr': 0.0004997085495514788, 'samples': 820992, 'steps': 4275, 'loss/train': 2.0807552337646484} +11/06/2021 21:51:39 - INFO - __main__ - Step 4277: {'lr': 0.0004997082933248421, 'samples': 821184, 'steps': 4276, 'loss/train': 2.0649728775024414} +11/06/2021 21:51:40 - INFO - __main__ - Step 4278: {'lr': 0.0004997080369856907, 'samples': 821376, 'steps': 4277, 'loss/train': 2.0820047855377197} +11/06/2021 21:51:41 - INFO - __main__ - Step 4279: {'lr': 0.0004997077805340248, 'samples': 821568, 'steps': 4278, 'loss/train': 1.6447721719741821} +11/06/2021 21:51:41 - INFO - __main__ - Step 4280: {'lr': 0.0004997075239698445, 'samples': 821760, 'steps': 4279, 'loss/train': 1.9901349544525146} +11/06/2021 21:51:41 - INFO - __main__ - Step 4281: {'lr': 0.0004997072672931497, 'samples': 821952, 'steps': 4280, 'loss/train': 2.4467787742614746} +11/06/2021 21:51:42 - INFO - __main__ - Step 4282: {'lr': 0.0004997070105039407, 'samples': 822144, 'steps': 4281, 'loss/train': 1.6936836242675781} +11/06/2021 21:51:43 - INFO - __main__ - Step 4283: {'lr': 0.0004997067536022176, 'samples': 822336, 'steps': 4282, 'loss/train': 2.122401475906372} +11/06/2021 21:51:43 - INFO - __main__ - Step 4284: {'lr': 0.0004997064965879804, 'samples': 822528, 'steps': 4283, 'loss/train': 2.0260608196258545} +11/06/2021 21:51:44 - INFO - __main__ - Step 4285: {'lr': 0.0004997062394612293, 'samples': 822720, 'steps': 4284, 'loss/train': 2.1867868900299072} +11/06/2021 21:51:44 - INFO - __main__ - Step 4286: {'lr': 0.0004997059822219645, 'samples': 822912, 'steps': 4285, 'loss/train': 2.057260274887085} +11/06/2021 21:51:44 - INFO - __main__ - Step 4287: {'lr': 0.000499705724870186, 'samples': 823104, 'steps': 4286, 'loss/train': 2.2277965545654297} +11/06/2021 21:51:45 - INFO - __main__ - Step 4288: {'lr': 0.0004997054674058941, 'samples': 823296, 'steps': 4287, 'loss/train': 2.590022325515747} +11/06/2021 21:51:46 - INFO - __main__ - Step 4289: {'lr': 0.0004997052098290886, 'samples': 823488, 'steps': 4288, 'loss/train': 2.015610694885254} +11/06/2021 21:51:46 - INFO - __main__ - Step 4290: {'lr': 0.0004997049521397698, 'samples': 823680, 'steps': 4289, 'loss/train': 2.311326503753662} +11/06/2021 21:51:46 - INFO - __main__ - Step 4291: {'lr': 0.0004997046943379379, 'samples': 823872, 'steps': 4290, 'loss/train': 1.8215492963790894} +11/06/2021 21:51:47 - INFO - __main__ - Step 4292: {'lr': 0.0004997044364235928, 'samples': 824064, 'steps': 4291, 'loss/train': 1.7921706438064575} +11/06/2021 21:51:47 - INFO - __main__ - Step 4293: {'lr': 0.0004997041783967348, 'samples': 824256, 'steps': 4292, 'loss/train': 2.276956558227539} +11/06/2021 21:51:48 - INFO - __main__ - Step 4294: {'lr': 0.0004997039202573639, 'samples': 824448, 'steps': 4293, 'loss/train': 1.8650037050247192} +11/06/2021 21:51:48 - INFO - __main__ - Step 4295: {'lr': 0.0004997036620054803, 'samples': 824640, 'steps': 4294, 'loss/train': 2.3925178050994873} +11/06/2021 21:51:49 - INFO - __main__ - Step 4296: {'lr': 0.0004997034036410841, 'samples': 824832, 'steps': 4295, 'loss/train': 1.9569441080093384} +11/06/2021 21:51:49 - INFO - __main__ - Step 4297: {'lr': 0.0004997031451641754, 'samples': 825024, 'steps': 4296, 'loss/train': 1.8525234460830688} +11/06/2021 21:51:49 - INFO - __main__ - Step 4298: {'lr': 0.0004997028865747542, 'samples': 825216, 'steps': 4297, 'loss/train': 2.4801597595214844} +11/06/2021 21:51:51 - INFO - __main__ - Step 4299: {'lr': 0.0004997026278728209, 'samples': 825408, 'steps': 4298, 'loss/train': 2.3479583263397217} +11/06/2021 21:51:51 - INFO - __main__ - Step 4300: {'lr': 0.0004997023690583753, 'samples': 825600, 'steps': 4299, 'loss/train': 1.8593815565109253} +11/06/2021 21:51:51 - INFO - __main__ - Step 4301: {'lr': 0.0004997021101314179, 'samples': 825792, 'steps': 4300, 'loss/train': 2.492985248565674} +11/06/2021 21:51:52 - INFO - __main__ - Step 4302: {'lr': 0.0004997018510919483, 'samples': 825984, 'steps': 4301, 'loss/train': 1.1239334344863892} +11/06/2021 21:51:52 - INFO - __main__ - Step 4303: {'lr': 0.0004997015919399671, 'samples': 826176, 'steps': 4302, 'loss/train': 2.068119525909424} +11/06/2021 21:51:53 - INFO - __main__ - Step 4304: {'lr': 0.0004997013326754742, 'samples': 826368, 'steps': 4303, 'loss/train': 2.1923468112945557} +11/06/2021 21:51:53 - INFO - __main__ - Step 4305: {'lr': 0.0004997010732984696, 'samples': 826560, 'steps': 4304, 'loss/train': 2.267517566680908} +11/06/2021 21:51:54 - INFO - __main__ - Step 4306: {'lr': 0.0004997008138089536, 'samples': 826752, 'steps': 4305, 'loss/train': 2.289822816848755} +11/06/2021 21:51:54 - INFO - __main__ - Step 4307: {'lr': 0.0004997005542069263, 'samples': 826944, 'steps': 4306, 'loss/train': 2.516078233718872} +11/06/2021 21:51:54 - INFO - __main__ - Step 4308: {'lr': 0.0004997002944923878, 'samples': 827136, 'steps': 4307, 'loss/train': 2.071676731109619} +11/06/2021 21:51:55 - INFO - __main__ - Step 4309: {'lr': 0.0004997000346653381, 'samples': 827328, 'steps': 4308, 'loss/train': 2.0077381134033203} +11/06/2021 21:51:56 - INFO - __main__ - Step 4310: {'lr': 0.0004996997747257775, 'samples': 827520, 'steps': 4309, 'loss/train': 2.347663640975952} +11/06/2021 21:51:56 - INFO - __main__ - Step 4311: {'lr': 0.000499699514673706, 'samples': 827712, 'steps': 4310, 'loss/train': 1.8493750095367432} +11/06/2021 21:51:56 - INFO - __main__ - Step 4312: {'lr': 0.0004996992545091239, 'samples': 827904, 'steps': 4311, 'loss/train': 1.9490984678268433} +11/06/2021 21:51:57 - INFO - __main__ - Step 4313: {'lr': 0.000499698994232031, 'samples': 828096, 'steps': 4312, 'loss/train': 2.2209248542785645} +11/06/2021 21:51:57 - INFO - __main__ - Step 4314: {'lr': 0.0004996987338424276, 'samples': 828288, 'steps': 4313, 'loss/train': 2.120884418487549} +11/06/2021 21:51:58 - INFO - __main__ - Step 4315: {'lr': 0.0004996984733403138, 'samples': 828480, 'steps': 4314, 'loss/train': 2.1321933269500732} +11/06/2021 21:51:59 - INFO - __main__ - Step 4316: {'lr': 0.0004996982127256898, 'samples': 828672, 'steps': 4315, 'loss/train': 2.0887527465820312} +11/06/2021 21:51:59 - INFO - __main__ - Step 4317: {'lr': 0.0004996979519985556, 'samples': 828864, 'steps': 4316, 'loss/train': 2.1263225078582764} +11/06/2021 21:51:59 - INFO - __main__ - Step 4318: {'lr': 0.0004996976911589114, 'samples': 829056, 'steps': 4317, 'loss/train': 1.8161555528640747} +11/06/2021 21:52:00 - INFO - __main__ - Step 4319: {'lr': 0.0004996974302067572, 'samples': 829248, 'steps': 4318, 'loss/train': 1.67631995677948} +11/06/2021 21:52:01 - INFO - __main__ - Step 4320: {'lr': 0.0004996971691420931, 'samples': 829440, 'steps': 4319, 'loss/train': 1.9163763523101807} +11/06/2021 21:52:01 - INFO - __main__ - Step 4321: {'lr': 0.0004996969079649195, 'samples': 829632, 'steps': 4320, 'loss/train': 1.8467737436294556} +11/06/2021 21:52:01 - INFO - __main__ - Step 4322: {'lr': 0.0004996966466752362, 'samples': 829824, 'steps': 4321, 'loss/train': 2.3159868717193604} +11/06/2021 21:52:02 - INFO - __main__ - Step 4323: {'lr': 0.0004996963852730436, 'samples': 830016, 'steps': 4322, 'loss/train': 1.9152145385742188} +11/06/2021 21:52:02 - INFO - __main__ - Step 4324: {'lr': 0.0004996961237583415, 'samples': 830208, 'steps': 4323, 'loss/train': 2.11564302444458} +11/06/2021 21:52:03 - INFO - __main__ - Step 4325: {'lr': 0.0004996958621311302, 'samples': 830400, 'steps': 4324, 'loss/train': 2.3892369270324707} +11/06/2021 21:52:03 - INFO - __main__ - Step 4326: {'lr': 0.00049969560039141, 'samples': 830592, 'steps': 4325, 'loss/train': 1.4963157176971436} +11/06/2021 21:52:04 - INFO - __main__ - Step 4327: {'lr': 0.0004996953385391806, 'samples': 830784, 'steps': 4326, 'loss/train': 2.2413148880004883} +11/06/2021 21:52:04 - INFO - __main__ - Step 4328: {'lr': 0.0004996950765744424, 'samples': 830976, 'steps': 4327, 'loss/train': 1.8104511499404907} +11/06/2021 21:52:04 - INFO - __main__ - Step 4329: {'lr': 0.0004996948144971953, 'samples': 831168, 'steps': 4328, 'loss/train': 1.7227517366409302} +11/06/2021 21:52:05 - INFO - __main__ - Step 4330: {'lr': 0.0004996945523074398, 'samples': 831360, 'steps': 4329, 'loss/train': 1.6873306035995483} +11/06/2021 21:52:06 - INFO - __main__ - Step 4331: {'lr': 0.0004996942900051757, 'samples': 831552, 'steps': 4330, 'loss/train': 2.224438190460205} +11/06/2021 21:52:06 - INFO - __main__ - Step 4332: {'lr': 0.0004996940275904031, 'samples': 831744, 'steps': 4331, 'loss/train': 2.1473422050476074} +11/06/2021 21:52:07 - INFO - __main__ - Step 4333: {'lr': 0.0004996937650631224, 'samples': 831936, 'steps': 4332, 'loss/train': 2.5668904781341553} +11/06/2021 21:52:07 - INFO - __main__ - Step 4334: {'lr': 0.0004996935024233335, 'samples': 832128, 'steps': 4333, 'loss/train': 2.192603349685669} +11/06/2021 21:52:08 - INFO - __main__ - Step 4335: {'lr': 0.0004996932396710365, 'samples': 832320, 'steps': 4334, 'loss/train': 1.7712533473968506} +11/06/2021 21:52:08 - INFO - __main__ - Step 4336: {'lr': 0.0004996929768062316, 'samples': 832512, 'steps': 4335, 'loss/train': 1.558101773262024} +11/06/2021 21:52:09 - INFO - __main__ - Step 4337: {'lr': 0.0004996927138289189, 'samples': 832704, 'steps': 4336, 'loss/train': 2.441239833831787} +11/06/2021 21:52:09 - INFO - __main__ - Step 4338: {'lr': 0.0004996924507390985, 'samples': 832896, 'steps': 4337, 'loss/train': 2.24872088432312} +11/06/2021 21:52:09 - INFO - __main__ - Step 4339: {'lr': 0.0004996921875367705, 'samples': 833088, 'steps': 4338, 'loss/train': 2.0886828899383545} +11/06/2021 21:52:10 - INFO - __main__ - Step 4340: {'lr': 0.0004996919242219352, 'samples': 833280, 'steps': 4339, 'loss/train': 2.2574408054351807} +11/06/2021 21:52:11 - INFO - __main__ - Step 4341: {'lr': 0.0004996916607945925, 'samples': 833472, 'steps': 4340, 'loss/train': 1.8286736011505127} +11/06/2021 21:52:11 - INFO - __main__ - Step 4342: {'lr': 0.0004996913972547426, 'samples': 833664, 'steps': 4341, 'loss/train': 2.018918037414551} +11/06/2021 21:52:11 - INFO - __main__ - Step 4343: {'lr': 0.0004996911336023855, 'samples': 833856, 'steps': 4342, 'loss/train': 2.208406925201416} +11/06/2021 21:52:12 - INFO - __main__ - Step 4344: {'lr': 0.0004996908698375216, 'samples': 834048, 'steps': 4343, 'loss/train': 1.9386653900146484} +11/06/2021 21:52:12 - INFO - __main__ - Step 4345: {'lr': 0.0004996906059601507, 'samples': 834240, 'steps': 4344, 'loss/train': 1.8494505882263184} +11/06/2021 21:52:13 - INFO - __main__ - Step 4346: {'lr': 0.0004996903419702731, 'samples': 834432, 'steps': 4345, 'loss/train': 2.3450777530670166} +11/06/2021 21:52:13 - INFO - __main__ - Step 4347: {'lr': 0.0004996900778678889, 'samples': 834624, 'steps': 4346, 'loss/train': 2.0560898780822754} +11/06/2021 21:52:14 - INFO - __main__ - Step 4348: {'lr': 0.0004996898136529982, 'samples': 834816, 'steps': 4347, 'loss/train': 2.482868194580078} +11/06/2021 21:52:14 - INFO - __main__ - Step 4349: {'lr': 0.0004996895493256012, 'samples': 835008, 'steps': 4348, 'loss/train': 1.759129524230957} +11/06/2021 21:52:14 - INFO - __main__ - Step 4350: {'lr': 0.0004996892848856978, 'samples': 835200, 'steps': 4349, 'loss/train': 1.8137215375900269} +11/06/2021 21:52:16 - INFO - __main__ - Step 4351: {'lr': 0.0004996890203332883, 'samples': 835392, 'steps': 4350, 'loss/train': 1.9098490476608276} +11/06/2021 21:52:16 - INFO - __main__ - Step 4352: {'lr': 0.0004996887556683729, 'samples': 835584, 'steps': 4351, 'loss/train': 2.027623414993286} +11/06/2021 21:52:16 - INFO - __main__ - Step 4353: {'lr': 0.0004996884908909515, 'samples': 835776, 'steps': 4352, 'loss/train': 2.083651304244995} +11/06/2021 21:52:17 - INFO - __main__ - Step 4354: {'lr': 0.0004996882260010243, 'samples': 835968, 'steps': 4353, 'loss/train': 1.6562211513519287} +11/06/2021 21:52:17 - INFO - __main__ - Step 4355: {'lr': 0.0004996879609985915, 'samples': 836160, 'steps': 4354, 'loss/train': 1.846291422843933} +11/06/2021 21:52:18 - INFO - __main__ - Step 4356: {'lr': 0.0004996876958836532, 'samples': 836352, 'steps': 4355, 'loss/train': 2.066518783569336} +11/06/2021 21:52:19 - INFO - __main__ - Step 4357: {'lr': 0.0004996874306562093, 'samples': 836544, 'steps': 4356, 'loss/train': 2.2601191997528076} +11/06/2021 21:52:19 - INFO - __main__ - Step 4358: {'lr': 0.0004996871653162602, 'samples': 836736, 'steps': 4357, 'loss/train': 2.134087562561035} +11/06/2021 21:52:19 - INFO - __main__ - Step 4359: {'lr': 0.0004996868998638059, 'samples': 836928, 'steps': 4358, 'loss/train': 2.3234333992004395} +11/06/2021 21:52:20 - INFO - __main__ - Step 4360: {'lr': 0.0004996866342988467, 'samples': 837120, 'steps': 4359, 'loss/train': 2.3369786739349365} +11/06/2021 21:52:20 - INFO - __main__ - Step 4361: {'lr': 0.0004996863686213823, 'samples': 837312, 'steps': 4360, 'loss/train': 2.203856945037842} +11/06/2021 21:52:21 - INFO - __main__ - Step 4362: {'lr': 0.0004996861028314133, 'samples': 837504, 'steps': 4361, 'loss/train': 2.04062557220459} +11/06/2021 21:52:21 - INFO - __main__ - Step 4363: {'lr': 0.0004996858369289394, 'samples': 837696, 'steps': 4362, 'loss/train': 2.0130574703216553} +11/06/2021 21:52:22 - INFO - __main__ - Step 4364: {'lr': 0.000499685570913961, 'samples': 837888, 'steps': 4363, 'loss/train': 1.978306770324707} +11/06/2021 21:52:22 - INFO - __main__ - Step 4365: {'lr': 0.0004996853047864781, 'samples': 838080, 'steps': 4364, 'loss/train': 2.3143999576568604} +11/06/2021 21:52:22 - INFO - __main__ - Step 4366: {'lr': 0.0004996850385464909, 'samples': 838272, 'steps': 4365, 'loss/train': 2.2573633193969727} +11/06/2021 21:52:23 - INFO - __main__ - Step 4367: {'lr': 0.0004996847721939994, 'samples': 838464, 'steps': 4366, 'loss/train': 1.7779031991958618} +11/06/2021 21:52:24 - INFO - __main__ - Step 4368: {'lr': 0.0004996845057290039, 'samples': 838656, 'steps': 4367, 'loss/train': 2.1156513690948486} +11/06/2021 21:52:24 - INFO - __main__ - Step 4369: {'lr': 0.0004996842391515044, 'samples': 838848, 'steps': 4368, 'loss/train': 1.8346737623214722} +11/06/2021 21:52:25 - INFO - __main__ - Step 4370: {'lr': 0.000499683972461501, 'samples': 839040, 'steps': 4369, 'loss/train': 1.7656928300857544} +11/06/2021 21:52:25 - INFO - __main__ - Step 4371: {'lr': 0.0004996837056589938, 'samples': 839232, 'steps': 4370, 'loss/train': 1.4817529916763306} +11/06/2021 21:52:25 - INFO - __main__ - Step 4372: {'lr': 0.0004996834387439831, 'samples': 839424, 'steps': 4371, 'loss/train': 2.4186854362487793} +11/06/2021 21:52:26 - INFO - __main__ - Step 4373: {'lr': 0.0004996831717164689, 'samples': 839616, 'steps': 4372, 'loss/train': 2.3830738067626953} +11/06/2021 21:52:27 - INFO - __main__ - Step 4374: {'lr': 0.0004996829045764512, 'samples': 839808, 'steps': 4373, 'loss/train': 2.039133310317993} +11/06/2021 21:52:27 - INFO - __main__ - Step 4375: {'lr': 0.0004996826373239303, 'samples': 840000, 'steps': 4374, 'loss/train': 1.8050706386566162} +11/06/2021 21:52:27 - INFO - __main__ - Step 4376: {'lr': 0.0004996823699589062, 'samples': 840192, 'steps': 4375, 'loss/train': 2.005566120147705} +11/06/2021 21:52:28 - INFO - __main__ - Step 4377: {'lr': 0.0004996821024813791, 'samples': 840384, 'steps': 4376, 'loss/train': 2.3006296157836914} +11/06/2021 21:52:29 - INFO - __main__ - Step 4378: {'lr': 0.0004996818348913491, 'samples': 840576, 'steps': 4377, 'loss/train': 1.9584013223648071} +11/06/2021 21:52:29 - INFO - __main__ - Step 4379: {'lr': 0.0004996815671888163, 'samples': 840768, 'steps': 4378, 'loss/train': 2.180757522583008} +11/06/2021 21:52:29 - INFO - __main__ - Step 4380: {'lr': 0.000499681299373781, 'samples': 840960, 'steps': 4379, 'loss/train': 2.559288740158081} +11/06/2021 21:52:30 - INFO - __main__ - Step 4381: {'lr': 0.0004996810314462429, 'samples': 841152, 'steps': 4380, 'loss/train': 1.7387698888778687} +11/06/2021 21:52:30 - INFO - __main__ - Step 4382: {'lr': 0.0004996807634062025, 'samples': 841344, 'steps': 4381, 'loss/train': 2.247429847717285} +11/06/2021 21:52:31 - INFO - __main__ - Step 4383: {'lr': 0.0004996804952536599, 'samples': 841536, 'steps': 4382, 'loss/train': 2.5863077640533447} +11/06/2021 21:52:31 - INFO - __main__ - Step 4384: {'lr': 0.0004996802269886149, 'samples': 841728, 'steps': 4383, 'loss/train': 1.9979889392852783} +11/06/2021 21:52:32 - INFO - __main__ - Step 4385: {'lr': 0.0004996799586110681, 'samples': 841920, 'steps': 4384, 'loss/train': 2.161149501800537} +11/06/2021 21:52:32 - INFO - __main__ - Step 4386: {'lr': 0.0004996796901210192, 'samples': 842112, 'steps': 4385, 'loss/train': 2.0866355895996094} +11/06/2021 21:52:32 - INFO - __main__ - Step 4387: {'lr': 0.0004996794215184685, 'samples': 842304, 'steps': 4386, 'loss/train': 2.5882389545440674} +11/06/2021 21:52:33 - INFO - __main__ - Step 4388: {'lr': 0.0004996791528034161, 'samples': 842496, 'steps': 4387, 'loss/train': 1.5546870231628418} +11/06/2021 21:52:34 - INFO - __main__ - Step 4389: {'lr': 0.0004996788839758622, 'samples': 842688, 'steps': 4388, 'loss/train': 2.4196763038635254} +11/06/2021 21:52:34 - INFO - __main__ - Step 4390: {'lr': 0.0004996786150358068, 'samples': 842880, 'steps': 4389, 'loss/train': 1.6892547607421875} +11/06/2021 21:52:35 - INFO - __main__ - Step 4391: {'lr': 0.00049967834598325, 'samples': 843072, 'steps': 4390, 'loss/train': 2.1776304244995117} +11/06/2021 21:52:35 - INFO - __main__ - Step 4392: {'lr': 0.0004996780768181921, 'samples': 843264, 'steps': 4391, 'loss/train': 2.4177329540252686} +11/06/2021 21:52:35 - INFO - __main__ - Step 4393: {'lr': 0.0004996778075406331, 'samples': 843456, 'steps': 4392, 'loss/train': 1.8474143743515015} +11/06/2021 21:52:36 - INFO - __main__ - Step 4394: {'lr': 0.0004996775381505731, 'samples': 843648, 'steps': 4393, 'loss/train': 1.766103744506836} +11/06/2021 21:52:37 - INFO - __main__ - Step 4395: {'lr': 0.0004996772686480122, 'samples': 843840, 'steps': 4394, 'loss/train': 2.221249580383301} +11/06/2021 21:52:37 - INFO - __main__ - Step 4396: {'lr': 0.0004996769990329507, 'samples': 844032, 'steps': 4395, 'loss/train': 1.950240135192871} +11/06/2021 21:52:37 - INFO - __main__ - Step 4397: {'lr': 0.0004996767293053885, 'samples': 844224, 'steps': 4396, 'loss/train': 1.8675569295883179} +11/06/2021 21:52:38 - INFO - __main__ - Step 4398: {'lr': 0.0004996764594653258, 'samples': 844416, 'steps': 4397, 'loss/train': 2.6407816410064697} +11/06/2021 21:52:39 - INFO - __main__ - Step 4399: {'lr': 0.0004996761895127628, 'samples': 844608, 'steps': 4398, 'loss/train': 1.6900591850280762} +11/06/2021 21:52:39 - INFO - __main__ - Step 4400: {'lr': 0.0004996759194476996, 'samples': 844800, 'steps': 4399, 'loss/train': 0.33388879895210266} +11/06/2021 21:52:39 - INFO - __main__ - Step 4401: {'lr': 0.0004996756492701362, 'samples': 844992, 'steps': 4400, 'loss/train': 1.999221682548523} +11/06/2021 21:52:40 - INFO - __main__ - Step 4402: {'lr': 0.0004996753789800729, 'samples': 845184, 'steps': 4401, 'loss/train': 2.3262462615966797} +11/06/2021 21:52:40 - INFO - __main__ - Step 4403: {'lr': 0.0004996751085775096, 'samples': 845376, 'steps': 4402, 'loss/train': 2.0857207775115967} +11/06/2021 21:52:41 - INFO - __main__ - Step 4404: {'lr': 0.0004996748380624467, 'samples': 845568, 'steps': 4403, 'loss/train': 1.382709264755249} +11/06/2021 21:52:41 - INFO - __main__ - Step 4405: {'lr': 0.000499674567434884, 'samples': 845760, 'steps': 4404, 'loss/train': 2.260540008544922} +11/06/2021 21:52:42 - INFO - __main__ - Step 4406: {'lr': 0.0004996742966948219, 'samples': 845952, 'steps': 4405, 'loss/train': 1.8191969394683838} +11/06/2021 21:52:42 - INFO - __main__ - Step 4407: {'lr': 0.0004996740258422604, 'samples': 846144, 'steps': 4406, 'loss/train': 2.2261736392974854} +11/06/2021 21:52:43 - INFO - __main__ - Step 4408: {'lr': 0.0004996737548771997, 'samples': 846336, 'steps': 4407, 'loss/train': 1.8432106971740723} +11/06/2021 21:52:44 - INFO - __main__ - Step 4409: {'lr': 0.0004996734837996397, 'samples': 846528, 'steps': 4408, 'loss/train': 2.118229627609253} +11/06/2021 21:52:44 - INFO - __main__ - Step 4410: {'lr': 0.0004996732126095807, 'samples': 846720, 'steps': 4409, 'loss/train': 1.7854758501052856} +11/06/2021 21:52:44 - INFO - __main__ - Step 4411: {'lr': 0.0004996729413070229, 'samples': 846912, 'steps': 4410, 'loss/train': 2.3659751415252686} +11/06/2021 21:52:45 - INFO - __main__ - Step 4412: {'lr': 0.0004996726698919664, 'samples': 847104, 'steps': 4411, 'loss/train': 1.817520260810852} +11/06/2021 21:52:45 - INFO - __main__ - Step 4413: {'lr': 0.0004996723983644112, 'samples': 847296, 'steps': 4412, 'loss/train': 1.4988713264465332} +11/06/2021 21:52:46 - INFO - __main__ - Step 4414: {'lr': 0.0004996721267243573, 'samples': 847488, 'steps': 4413, 'loss/train': 1.2573717832565308} +11/06/2021 21:52:47 - INFO - __main__ - Step 4415: {'lr': 0.0004996718549718051, 'samples': 847680, 'steps': 4414, 'loss/train': 1.9494376182556152} +11/06/2021 21:52:47 - INFO - __main__ - Step 4416: {'lr': 0.0004996715831067546, 'samples': 847872, 'steps': 4415, 'loss/train': 0.341790109872818} +11/06/2021 21:52:47 - INFO - __main__ - Step 4417: {'lr': 0.000499671311129206, 'samples': 848064, 'steps': 4416, 'loss/train': 1.7873398065567017} +11/06/2021 21:52:48 - INFO - __main__ - Step 4418: {'lr': 0.0004996710390391593, 'samples': 848256, 'steps': 4417, 'loss/train': 2.2925448417663574} +11/06/2021 21:52:49 - INFO - __main__ - Step 4419: {'lr': 0.0004996707668366147, 'samples': 848448, 'steps': 4418, 'loss/train': 2.3310353755950928} +11/06/2021 21:52:49 - INFO - __main__ - Step 4420: {'lr': 0.0004996704945215724, 'samples': 848640, 'steps': 4419, 'loss/train': 1.234442949295044} +11/06/2021 21:52:49 - INFO - __main__ - Step 4421: {'lr': 0.0004996702220940322, 'samples': 848832, 'steps': 4420, 'loss/train': 2.263622522354126} +11/06/2021 21:52:50 - INFO - __main__ - Step 4422: {'lr': 0.0004996699495539947, 'samples': 849024, 'steps': 4421, 'loss/train': 2.1597673892974854} +11/06/2021 21:52:50 - INFO - __main__ - Step 4423: {'lr': 0.0004996696769014596, 'samples': 849216, 'steps': 4422, 'loss/train': 2.2731714248657227} +11/06/2021 21:52:50 - INFO - __main__ - Step 4424: {'lr': 0.0004996694041364272, 'samples': 849408, 'steps': 4423, 'loss/train': 2.049422264099121} +11/06/2021 21:52:51 - INFO - __main__ - Step 4425: {'lr': 0.0004996691312588977, 'samples': 849600, 'steps': 4424, 'loss/train': 1.7566492557525635} +11/06/2021 21:52:52 - INFO - __main__ - Step 4426: {'lr': 0.0004996688582688711, 'samples': 849792, 'steps': 4425, 'loss/train': 2.2029178142547607} +11/06/2021 21:52:52 - INFO - __main__ - Step 4427: {'lr': 0.0004996685851663477, 'samples': 849984, 'steps': 4426, 'loss/train': 2.1259970664978027} +11/06/2021 21:52:52 - INFO - __main__ - Step 4428: {'lr': 0.0004996683119513274, 'samples': 850176, 'steps': 4427, 'loss/train': 1.6493570804595947} +11/06/2021 21:52:53 - INFO - __main__ - Step 4429: {'lr': 0.0004996680386238103, 'samples': 850368, 'steps': 4428, 'loss/train': 1.9351447820663452} +11/06/2021 21:52:54 - INFO - __main__ - Step 4430: {'lr': 0.0004996677651837967, 'samples': 850560, 'steps': 4429, 'loss/train': 2.663370132446289} +11/06/2021 21:52:54 - INFO - __main__ - Step 4431: {'lr': 0.0004996674916312867, 'samples': 850752, 'steps': 4430, 'loss/train': 2.205284595489502} +11/06/2021 21:52:55 - INFO - __main__ - Step 4432: {'lr': 0.0004996672179662803, 'samples': 850944, 'steps': 4431, 'loss/train': 0.6293364763259888} +11/06/2021 21:52:55 - INFO - __main__ - Step 4433: {'lr': 0.0004996669441887778, 'samples': 851136, 'steps': 4432, 'loss/train': 1.934459924697876} +11/06/2021 21:52:55 - INFO - __main__ - Step 4434: {'lr': 0.0004996666702987791, 'samples': 851328, 'steps': 4433, 'loss/train': 1.715638518333435} +11/06/2021 21:52:56 - INFO - __main__ - Step 4435: {'lr': 0.0004996663962962846, 'samples': 851520, 'steps': 4434, 'loss/train': 2.070112705230713} +11/06/2021 21:52:57 - INFO - __main__ - Step 4436: {'lr': 0.0004996661221812942, 'samples': 851712, 'steps': 4435, 'loss/train': 2.642328977584839} +11/06/2021 21:52:57 - INFO - __main__ - Step 4437: {'lr': 0.0004996658479538081, 'samples': 851904, 'steps': 4436, 'loss/train': 2.1696090698242188} +11/06/2021 21:52:57 - INFO - __main__ - Step 4438: {'lr': 0.0004996655736138265, 'samples': 852096, 'steps': 4437, 'loss/train': 2.149383783340454} +11/06/2021 21:52:58 - INFO - __main__ - Step 4439: {'lr': 0.0004996652991613494, 'samples': 852288, 'steps': 4438, 'loss/train': 1.425952434539795} +11/06/2021 21:52:59 - INFO - __main__ - Step 4440: {'lr': 0.0004996650245963768, 'samples': 852480, 'steps': 4439, 'loss/train': 1.9291316270828247} +11/06/2021 21:53:00 - INFO - __main__ - Step 4441: {'lr': 0.0004996647499189092, 'samples': 852672, 'steps': 4440, 'loss/train': 1.8874024152755737} +11/06/2021 21:53:00 - INFO - __main__ - Step 4442: {'lr': 0.0004996644751289464, 'samples': 852864, 'steps': 4441, 'loss/train': 1.797756552696228} +11/06/2021 21:53:00 - INFO - __main__ - Step 4443: {'lr': 0.0004996642002264887, 'samples': 853056, 'steps': 4442, 'loss/train': 2.348628282546997} +11/06/2021 21:53:01 - INFO - __main__ - Step 4444: {'lr': 0.0004996639252115362, 'samples': 853248, 'steps': 4443, 'loss/train': 1.8861411809921265} +11/06/2021 21:53:01 - INFO - __main__ - Step 4445: {'lr': 0.000499663650084089, 'samples': 853440, 'steps': 4444, 'loss/train': 2.2785558700561523} +11/06/2021 21:53:01 - INFO - __main__ - Step 4446: {'lr': 0.0004996633748441472, 'samples': 853632, 'steps': 4445, 'loss/train': 2.116128444671631} +11/06/2021 21:53:03 - INFO - __main__ - Step 4447: {'lr': 0.0004996630994917108, 'samples': 853824, 'steps': 4446, 'loss/train': 1.9847468137741089} +11/06/2021 21:53:03 - INFO - __main__ - Step 4448: {'lr': 0.0004996628240267802, 'samples': 854016, 'steps': 4447, 'loss/train': 2.634124755859375} +11/06/2021 21:53:03 - INFO - __main__ - Step 4449: {'lr': 0.0004996625484493554, 'samples': 854208, 'steps': 4448, 'loss/train': 1.749208927154541} +11/06/2021 21:53:04 - INFO - __main__ - Step 4450: {'lr': 0.0004996622727594363, 'samples': 854400, 'steps': 4449, 'loss/train': 1.287934422492981} +11/06/2021 21:53:04 - INFO - __main__ - Step 4451: {'lr': 0.0004996619969570234, 'samples': 854592, 'steps': 4450, 'loss/train': 2.1173369884490967} +11/06/2021 21:53:05 - INFO - __main__ - Step 4452: {'lr': 0.0004996617210421166, 'samples': 854784, 'steps': 4451, 'loss/train': 1.4185445308685303} +11/06/2021 21:53:05 - INFO - __main__ - Step 4453: {'lr': 0.0004996614450147161, 'samples': 854976, 'steps': 4452, 'loss/train': 2.3131630420684814} +11/06/2021 21:53:06 - INFO - __main__ - Step 4454: {'lr': 0.0004996611688748221, 'samples': 855168, 'steps': 4453, 'loss/train': 0.5444425940513611} +11/06/2021 21:53:06 - INFO - __main__ - Step 4455: {'lr': 0.0004996608926224345, 'samples': 855360, 'steps': 4454, 'loss/train': 2.0416908264160156} +11/06/2021 21:53:06 - INFO - __main__ - Step 4456: {'lr': 0.0004996606162575536, 'samples': 855552, 'steps': 4455, 'loss/train': 1.4575010538101196} +11/06/2021 21:53:07 - INFO - __main__ - Step 4457: {'lr': 0.0004996603397801795, 'samples': 855744, 'steps': 4456, 'loss/train': 2.1322479248046875} +11/06/2021 21:53:08 - INFO - __main__ - Step 4458: {'lr': 0.0004996600631903123, 'samples': 855936, 'steps': 4457, 'loss/train': 2.1813089847564697} +11/06/2021 21:53:08 - INFO - __main__ - Step 4459: {'lr': 0.0004996597864879521, 'samples': 856128, 'steps': 4458, 'loss/train': 2.2517218589782715} +11/06/2021 21:53:08 - INFO - __main__ - Step 4460: {'lr': 0.000499659509673099, 'samples': 856320, 'steps': 4459, 'loss/train': 2.0033187866210938} +11/06/2021 21:53:09 - INFO - __main__ - Step 4461: {'lr': 0.0004996592327457533, 'samples': 856512, 'steps': 4460, 'loss/train': 1.793095350265503} +11/06/2021 21:53:10 - INFO - __main__ - Step 4462: {'lr': 0.000499658955705915, 'samples': 856704, 'steps': 4461, 'loss/train': 2.264535665512085} +11/06/2021 21:53:10 - INFO - __main__ - Step 4463: {'lr': 0.0004996586785535841, 'samples': 856896, 'steps': 4462, 'loss/train': 2.0258359909057617} +11/06/2021 21:53:11 - INFO - __main__ - Step 4464: {'lr': 0.000499658401288761, 'samples': 857088, 'steps': 4463, 'loss/train': 1.9607642889022827} +11/06/2021 21:53:11 - INFO - __main__ - Step 4465: {'lr': 0.0004996581239114456, 'samples': 857280, 'steps': 4464, 'loss/train': 1.6711504459381104} +11/06/2021 21:53:11 - INFO - __main__ - Step 4466: {'lr': 0.0004996578464216381, 'samples': 857472, 'steps': 4465, 'loss/train': 2.1529288291931152} +11/06/2021 21:53:12 - INFO - __main__ - Step 4467: {'lr': 0.0004996575688193386, 'samples': 857664, 'steps': 4466, 'loss/train': 1.737178087234497} +11/06/2021 21:53:13 - INFO - __main__ - Step 4468: {'lr': 0.0004996572911045473, 'samples': 857856, 'steps': 4467, 'loss/train': 2.233004570007324} +11/06/2021 21:53:13 - INFO - __main__ - Step 4469: {'lr': 0.0004996570132772642, 'samples': 858048, 'steps': 4468, 'loss/train': 1.742701530456543} +11/06/2021 21:53:13 - INFO - __main__ - Step 4470: {'lr': 0.0004996567353374896, 'samples': 858240, 'steps': 4469, 'loss/train': 2.380733013153076} +11/06/2021 21:53:14 - INFO - __main__ - Step 4471: {'lr': 0.0004996564572852235, 'samples': 858432, 'steps': 4470, 'loss/train': 2.0802853107452393} +11/06/2021 21:53:14 - INFO - __main__ - Step 4472: {'lr': 0.000499656179120466, 'samples': 858624, 'steps': 4471, 'loss/train': 1.6092973947525024} +11/06/2021 21:53:15 - INFO - __main__ - Step 4473: {'lr': 0.0004996559008432173, 'samples': 858816, 'steps': 4472, 'loss/train': 3.0951523780822754} +11/06/2021 21:53:16 - INFO - __main__ - Step 4474: {'lr': 0.0004996556224534776, 'samples': 859008, 'steps': 4473, 'loss/train': 2.4669737815856934} +11/06/2021 21:53:16 - INFO - __main__ - Step 4475: {'lr': 0.0004996553439512468, 'samples': 859200, 'steps': 4474, 'loss/train': 2.577219247817993} +11/06/2021 21:53:16 - INFO - __main__ - Step 4476: {'lr': 0.0004996550653365253, 'samples': 859392, 'steps': 4475, 'loss/train': 1.7655971050262451} +11/06/2021 21:53:17 - INFO - __main__ - Step 4477: {'lr': 0.0004996547866093129, 'samples': 859584, 'steps': 4476, 'loss/train': 2.026312828063965} +11/06/2021 21:53:17 - INFO - __main__ - Step 4478: {'lr': 0.00049965450776961, 'samples': 859776, 'steps': 4477, 'loss/train': 2.0732200145721436} +11/06/2021 21:53:18 - INFO - __main__ - Step 4479: {'lr': 0.0004996542288174166, 'samples': 859968, 'steps': 4478, 'loss/train': 2.4320411682128906} +11/06/2021 21:53:18 - INFO - __main__ - Step 4480: {'lr': 0.0004996539497527329, 'samples': 860160, 'steps': 4479, 'loss/train': 1.8877087831497192} +11/06/2021 21:53:19 - INFO - __main__ - Step 4481: {'lr': 0.000499653670575559, 'samples': 860352, 'steps': 4480, 'loss/train': 1.376404047012329} +11/06/2021 21:53:19 - INFO - __main__ - Step 4482: {'lr': 0.0004996533912858949, 'samples': 860544, 'steps': 4481, 'loss/train': 1.817132592201233} +11/06/2021 21:53:19 - INFO - __main__ - Step 4483: {'lr': 0.000499653111883741, 'samples': 860736, 'steps': 4482, 'loss/train': 2.1700544357299805} +11/06/2021 21:53:20 - INFO - __main__ - Step 4484: {'lr': 0.0004996528323690971, 'samples': 860928, 'steps': 4483, 'loss/train': 1.9818646907806396} +11/06/2021 21:53:21 - INFO - __main__ - Step 4485: {'lr': 0.0004996525527419636, 'samples': 861120, 'steps': 4484, 'loss/train': 1.9006667137145996} +11/06/2021 21:53:21 - INFO - __main__ - Step 4486: {'lr': 0.0004996522730023404, 'samples': 861312, 'steps': 4485, 'loss/train': 1.9432722330093384} +11/06/2021 21:53:21 - INFO - __main__ - Step 4487: {'lr': 0.0004996519931502279, 'samples': 861504, 'steps': 4486, 'loss/train': 2.3324050903320312} +11/06/2021 21:53:22 - INFO - __main__ - Step 4488: {'lr': 0.0004996517131856259, 'samples': 861696, 'steps': 4487, 'loss/train': 1.8573492765426636} +11/06/2021 21:53:23 - INFO - __main__ - Step 4489: {'lr': 0.0004996514331085348, 'samples': 861888, 'steps': 4488, 'loss/train': 1.8287177085876465} +11/06/2021 21:53:23 - INFO - __main__ - Step 4490: {'lr': 0.0004996511529189546, 'samples': 862080, 'steps': 4489, 'loss/train': 1.9560521841049194} +11/06/2021 21:53:24 - INFO - __main__ - Step 4491: {'lr': 0.0004996508726168854, 'samples': 862272, 'steps': 4490, 'loss/train': 2.2228381633758545} +11/06/2021 21:53:24 - INFO - __main__ - Step 4492: {'lr': 0.0004996505922023274, 'samples': 862464, 'steps': 4491, 'loss/train': 2.6008143424987793} +11/06/2021 21:53:24 - INFO - __main__ - Step 4493: {'lr': 0.0004996503116752807, 'samples': 862656, 'steps': 4492, 'loss/train': 2.061739206314087} +11/06/2021 21:53:25 - INFO - __main__ - Step 4494: {'lr': 0.0004996500310357454, 'samples': 862848, 'steps': 4493, 'loss/train': 1.7886160612106323} +11/06/2021 21:53:26 - INFO - __main__ - Step 4495: {'lr': 0.0004996497502837217, 'samples': 863040, 'steps': 4494, 'loss/train': 1.68747878074646} +11/06/2021 21:53:26 - INFO - __main__ - Step 4496: {'lr': 0.0004996494694192096, 'samples': 863232, 'steps': 4495, 'loss/train': 1.7942966222763062} +11/06/2021 21:53:26 - INFO - __main__ - Step 4497: {'lr': 0.0004996491884422092, 'samples': 863424, 'steps': 4496, 'loss/train': 2.276155948638916} +11/06/2021 21:53:27 - INFO - __main__ - Step 4498: {'lr': 0.0004996489073527208, 'samples': 863616, 'steps': 4497, 'loss/train': 2.0408365726470947} +11/06/2021 21:53:28 - INFO - __main__ - Step 4499: {'lr': 0.0004996486261507445, 'samples': 863808, 'steps': 4498, 'loss/train': 2.200601816177368} +11/06/2021 21:53:28 - INFO - __main__ - Step 4500: {'lr': 0.0004996483448362805, 'samples': 864000, 'steps': 4499, 'loss/train': 2.0834293365478516} +11/06/2021 21:53:28 - INFO - __main__ - Step 4501: {'lr': 0.0004996480634093287, 'samples': 864192, 'steps': 4500, 'loss/train': 1.751892328262329} +11/06/2021 21:53:29 - INFO - __main__ - Step 4502: {'lr': 0.0004996477818698893, 'samples': 864384, 'steps': 4501, 'loss/train': 2.13613224029541} +11/06/2021 21:53:29 - INFO - __main__ - Step 4503: {'lr': 0.0004996475002179625, 'samples': 864576, 'steps': 4502, 'loss/train': 2.1853764057159424} +11/06/2021 21:53:30 - INFO - __main__ - Step 4504: {'lr': 0.0004996472184535484, 'samples': 864768, 'steps': 4503, 'loss/train': 1.418428659439087} +11/06/2021 21:53:30 - INFO - __main__ - Step 4505: {'lr': 0.0004996469365766471, 'samples': 864960, 'steps': 4504, 'loss/train': 1.7238401174545288} +11/06/2021 21:53:31 - INFO - __main__ - Step 4506: {'lr': 0.0004996466545872588, 'samples': 865152, 'steps': 4505, 'loss/train': 1.999024510383606} +11/06/2021 21:53:31 - INFO - __main__ - Step 4507: {'lr': 0.0004996463724853834, 'samples': 865344, 'steps': 4506, 'loss/train': 2.0768072605133057} +11/06/2021 21:53:31 - INFO - __main__ - Step 4508: {'lr': 0.0004996460902710214, 'samples': 865536, 'steps': 4507, 'loss/train': 1.8393359184265137} +11/06/2021 21:53:32 - INFO - __main__ - Step 4509: {'lr': 0.0004996458079441727, 'samples': 865728, 'steps': 4508, 'loss/train': 1.8585339784622192} +11/06/2021 21:53:33 - INFO - __main__ - Step 4510: {'lr': 0.0004996455255048373, 'samples': 865920, 'steps': 4509, 'loss/train': 1.3014329671859741} +11/06/2021 21:53:33 - INFO - __main__ - Step 4511: {'lr': 0.0004996452429530156, 'samples': 866112, 'steps': 4510, 'loss/train': 2.1434712409973145} +11/06/2021 21:53:33 - INFO - __main__ - Step 4512: {'lr': 0.0004996449602887075, 'samples': 866304, 'steps': 4511, 'loss/train': 1.680091142654419} +11/06/2021 21:53:34 - INFO - __main__ - Step 4513: {'lr': 0.0004996446775119134, 'samples': 866496, 'steps': 4512, 'loss/train': 1.8141558170318604} +11/06/2021 21:53:35 - INFO - __main__ - Step 4514: {'lr': 0.0004996443946226331, 'samples': 866688, 'steps': 4513, 'loss/train': 1.9032708406448364} +11/06/2021 21:53:35 - INFO - __main__ - Step 4515: {'lr': 0.000499644111620867, 'samples': 866880, 'steps': 4514, 'loss/train': 1.6730246543884277} +11/06/2021 21:53:36 - INFO - __main__ - Step 4516: {'lr': 0.000499643828506615, 'samples': 867072, 'steps': 4515, 'loss/train': 2.1784026622772217} +11/06/2021 21:53:36 - INFO - __main__ - Step 4517: {'lr': 0.0004996435452798775, 'samples': 867264, 'steps': 4516, 'loss/train': 1.8776859045028687} +11/06/2021 21:53:36 - INFO - __main__ - Step 4518: {'lr': 0.0004996432619406543, 'samples': 867456, 'steps': 4517, 'loss/train': 2.0420169830322266} +11/06/2021 21:53:37 - INFO - __main__ - Step 4519: {'lr': 0.0004996429784889458, 'samples': 867648, 'steps': 4518, 'loss/train': 2.412881851196289} +11/06/2021 21:53:38 - INFO - __main__ - Step 4520: {'lr': 0.000499642694924752, 'samples': 867840, 'steps': 4519, 'loss/train': 1.9957324266433716} +11/06/2021 21:53:38 - INFO - __main__ - Step 4521: {'lr': 0.000499642411248073, 'samples': 868032, 'steps': 4520, 'loss/train': 1.6232712268829346} +11/06/2021 21:53:38 - INFO - __main__ - Step 4522: {'lr': 0.0004996421274589091, 'samples': 868224, 'steps': 4521, 'loss/train': 2.311401128768921} +11/06/2021 21:53:39 - INFO - __main__ - Step 4523: {'lr': 0.0004996418435572603, 'samples': 868416, 'steps': 4522, 'loss/train': 2.561228036880493} +11/06/2021 21:53:39 - INFO - __main__ - Step 4524: {'lr': 0.0004996415595431267, 'samples': 868608, 'steps': 4523, 'loss/train': 2.3829054832458496} +11/06/2021 21:53:40 - INFO - __main__ - Step 4525: {'lr': 0.0004996412754165084, 'samples': 868800, 'steps': 4524, 'loss/train': 1.9954290390014648} +11/06/2021 21:53:40 - INFO - __main__ - Step 4526: {'lr': 0.0004996409911774056, 'samples': 868992, 'steps': 4525, 'loss/train': 1.9752427339553833} +11/06/2021 21:53:41 - INFO - __main__ - Step 4527: {'lr': 0.0004996407068258186, 'samples': 869184, 'steps': 4526, 'loss/train': 2.2408523559570312} +11/06/2021 21:53:41 - INFO - __main__ - Step 4528: {'lr': 0.0004996404223617471, 'samples': 869376, 'steps': 4527, 'loss/train': 1.6397135257720947} +11/06/2021 21:53:41 - INFO - __main__ - Step 4529: {'lr': 0.0004996401377851917, 'samples': 869568, 'steps': 4528, 'loss/train': 2.1448097229003906} +11/06/2021 21:53:42 - INFO - __main__ - Step 4530: {'lr': 0.0004996398530961522, 'samples': 869760, 'steps': 4529, 'loss/train': 1.8006598949432373} +11/06/2021 21:53:43 - INFO - __main__ - Step 4531: {'lr': 0.0004996395682946288, 'samples': 869952, 'steps': 4530, 'loss/train': 1.2451746463775635} +11/06/2021 21:53:43 - INFO - __main__ - Step 4532: {'lr': 0.0004996392833806217, 'samples': 870144, 'steps': 4531, 'loss/train': 1.7764043807983398} +11/06/2021 21:53:44 - INFO - __main__ - Step 4533: {'lr': 0.000499638998354131, 'samples': 870336, 'steps': 4532, 'loss/train': 2.118048667907715} +11/06/2021 21:53:44 - INFO - __main__ - Step 4534: {'lr': 0.0004996387132151567, 'samples': 870528, 'steps': 4533, 'loss/train': 2.315908908843994} +11/06/2021 21:53:45 - INFO - __main__ - Step 4535: {'lr': 0.0004996384279636993, 'samples': 870720, 'steps': 4534, 'loss/train': 2.341172218322754} +11/06/2021 21:53:45 - INFO - __main__ - Step 4536: {'lr': 0.0004996381425997584, 'samples': 870912, 'steps': 4535, 'loss/train': 2.5195581912994385} +11/06/2021 21:53:46 - INFO - __main__ - Step 4537: {'lr': 0.0004996378571233347, 'samples': 871104, 'steps': 4536, 'loss/train': 2.251058578491211} +11/06/2021 21:53:46 - INFO - __main__ - Step 4538: {'lr': 0.0004996375715344278, 'samples': 871296, 'steps': 4537, 'loss/train': 2.1683661937713623} +11/06/2021 21:53:46 - INFO - __main__ - Step 4539: {'lr': 0.0004996372858330382, 'samples': 871488, 'steps': 4538, 'loss/train': 2.623131275177002} +11/06/2021 21:53:47 - INFO - __main__ - Step 4540: {'lr': 0.0004996370000191657, 'samples': 871680, 'steps': 4539, 'loss/train': 2.218451738357544} +11/06/2021 21:53:48 - INFO - __main__ - Step 4541: {'lr': 0.0004996367140928107, 'samples': 871872, 'steps': 4540, 'loss/train': 2.884366989135742} +11/06/2021 21:53:48 - INFO - __main__ - Step 4542: {'lr': 0.0004996364280539734, 'samples': 872064, 'steps': 4541, 'loss/train': 2.3906033039093018} +11/06/2021 21:53:48 - INFO - __main__ - Step 4543: {'lr': 0.0004996361419026537, 'samples': 872256, 'steps': 4542, 'loss/train': 2.0911548137664795} +11/06/2021 21:53:49 - INFO - __main__ - Step 4544: {'lr': 0.0004996358556388518, 'samples': 872448, 'steps': 4543, 'loss/train': 2.255887269973755} +11/06/2021 21:53:49 - INFO - __main__ - Step 4545: {'lr': 0.0004996355692625678, 'samples': 872640, 'steps': 4544, 'loss/train': 2.3875391483306885} +11/06/2021 21:53:50 - INFO - __main__ - Step 4546: {'lr': 0.0004996352827738018, 'samples': 872832, 'steps': 4545, 'loss/train': 1.9046090841293335} +11/06/2021 21:53:50 - INFO - __main__ - Step 4547: {'lr': 0.0004996349961725542, 'samples': 873024, 'steps': 4546, 'loss/train': 1.6704214811325073} +11/06/2021 21:53:51 - INFO - __main__ - Step 4548: {'lr': 0.0004996347094588247, 'samples': 873216, 'steps': 4547, 'loss/train': 1.5265803337097168} +11/06/2021 21:53:51 - INFO - __main__ - Step 4549: {'lr': 0.0004996344226326137, 'samples': 873408, 'steps': 4548, 'loss/train': 2.1202685832977295} +11/06/2021 21:53:52 - INFO - __main__ - Step 4550: {'lr': 0.0004996341356939214, 'samples': 873600, 'steps': 4549, 'loss/train': 2.068074941635132} +11/06/2021 21:53:53 - INFO - __main__ - Step 4551: {'lr': 0.0004996338486427477, 'samples': 873792, 'steps': 4550, 'loss/train': 2.596259593963623} +11/06/2021 21:53:53 - INFO - __main__ - Step 4552: {'lr': 0.0004996335614790929, 'samples': 873984, 'steps': 4551, 'loss/train': 1.9318180084228516} +11/06/2021 21:53:53 - INFO - __main__ - Step 4553: {'lr': 0.0004996332742029571, 'samples': 874176, 'steps': 4552, 'loss/train': 1.7639127969741821} +11/06/2021 21:53:54 - INFO - __main__ - Step 4554: {'lr': 0.0004996329868143404, 'samples': 874368, 'steps': 4553, 'loss/train': 2.062023639678955} +11/06/2021 21:53:54 - INFO - __main__ - Step 4555: {'lr': 0.0004996326993132428, 'samples': 874560, 'steps': 4554, 'loss/train': 2.341677665710449} +11/06/2021 21:53:55 - INFO - __main__ - Step 4556: {'lr': 0.0004996324116996647, 'samples': 874752, 'steps': 4555, 'loss/train': 1.2803831100463867} +11/06/2021 21:53:55 - INFO - __main__ - Step 4557: {'lr': 0.0004996321239736059, 'samples': 874944, 'steps': 4556, 'loss/train': 1.2265723943710327} +11/06/2021 21:53:56 - INFO - __main__ - Step 4558: {'lr': 0.000499631836135067, 'samples': 875136, 'steps': 4557, 'loss/train': 1.5673511028289795} +11/06/2021 21:53:56 - INFO - __main__ - Step 4559: {'lr': 0.0004996315481840476, 'samples': 875328, 'steps': 4558, 'loss/train': 2.2120308876037598} +11/06/2021 21:53:56 - INFO - __main__ - Step 4560: {'lr': 0.0004996312601205482, 'samples': 875520, 'steps': 4559, 'loss/train': 1.771849513053894} +11/06/2021 21:53:57 - INFO - __main__ - Step 4561: {'lr': 0.0004996309719445687, 'samples': 875712, 'steps': 4560, 'loss/train': 1.6283718347549438} +11/06/2021 21:53:58 - INFO - __main__ - Step 4562: {'lr': 0.0004996306836561094, 'samples': 875904, 'steps': 4561, 'loss/train': 2.1488685607910156} +11/06/2021 21:53:58 - INFO - __main__ - Step 4563: {'lr': 0.0004996303952551704, 'samples': 876096, 'steps': 4562, 'loss/train': 3.6791834831237793} +11/06/2021 21:53:58 - INFO - __main__ - Step 4564: {'lr': 0.0004996301067417517, 'samples': 876288, 'steps': 4563, 'loss/train': 1.914914846420288} +11/06/2021 21:53:59 - INFO - __main__ - Step 4565: {'lr': 0.0004996298181158536, 'samples': 876480, 'steps': 4564, 'loss/train': 2.1919569969177246} +11/06/2021 21:53:59 - INFO - __main__ - Step 4566: {'lr': 0.0004996295293774762, 'samples': 876672, 'steps': 4565, 'loss/train': 2.0341947078704834} +11/06/2021 21:54:00 - INFO - __main__ - Step 4567: {'lr': 0.0004996292405266195, 'samples': 876864, 'steps': 4566, 'loss/train': 3.0565133094787598} +11/06/2021 21:54:01 - INFO - __main__ - Step 4568: {'lr': 0.0004996289515632838, 'samples': 877056, 'steps': 4567, 'loss/train': 1.6455254554748535} +11/06/2021 21:54:01 - INFO - __main__ - Step 4569: {'lr': 0.0004996286624874691, 'samples': 877248, 'steps': 4568, 'loss/train': 2.0319526195526123} +11/06/2021 21:54:01 - INFO - __main__ - Step 4570: {'lr': 0.0004996283732991755, 'samples': 877440, 'steps': 4569, 'loss/train': 2.2277791500091553} +11/06/2021 21:54:02 - INFO - __main__ - Step 4571: {'lr': 0.0004996280839984033, 'samples': 877632, 'steps': 4570, 'loss/train': 1.485971450805664} +11/06/2021 21:54:03 - INFO - __main__ - Step 4572: {'lr': 0.0004996277945851525, 'samples': 877824, 'steps': 4571, 'loss/train': 2.180328369140625} +11/06/2021 21:54:03 - INFO - __main__ - Step 4573: {'lr': 0.0004996275050594233, 'samples': 878016, 'steps': 4572, 'loss/train': 1.8692883253097534} +11/06/2021 21:54:03 - INFO - __main__ - Step 4574: {'lr': 0.0004996272154212158, 'samples': 878208, 'steps': 4573, 'loss/train': 0.9339056611061096} +11/06/2021 21:54:04 - INFO - __main__ - Step 4575: {'lr': 0.0004996269256705301, 'samples': 878400, 'steps': 4574, 'loss/train': 2.103940486907959} +11/06/2021 21:54:04 - INFO - __main__ - Step 4576: {'lr': 0.0004996266358073664, 'samples': 878592, 'steps': 4575, 'loss/train': 1.7924268245697021} +11/06/2021 21:54:05 - INFO - __main__ - Step 4577: {'lr': 0.0004996263458317248, 'samples': 878784, 'steps': 4576, 'loss/train': 1.6914095878601074} +11/06/2021 21:54:05 - INFO - __main__ - Step 4578: {'lr': 0.0004996260557436053, 'samples': 878976, 'steps': 4577, 'loss/train': 1.528101921081543} +11/06/2021 21:54:06 - INFO - __main__ - Step 4579: {'lr': 0.0004996257655430083, 'samples': 879168, 'steps': 4578, 'loss/train': 1.8863238096237183} +11/06/2021 21:54:06 - INFO - __main__ - Step 4580: {'lr': 0.0004996254752299337, 'samples': 879360, 'steps': 4579, 'loss/train': 1.8763165473937988} +11/06/2021 21:54:06 - INFO - __main__ - Step 4581: {'lr': 0.0004996251848043817, 'samples': 879552, 'steps': 4580, 'loss/train': 1.885318636894226} +11/06/2021 21:54:07 - INFO - __main__ - Step 4582: {'lr': 0.0004996248942663525, 'samples': 879744, 'steps': 4581, 'loss/train': 1.8357065916061401} +11/06/2021 21:54:08 - INFO - __main__ - Step 4583: {'lr': 0.000499624603615846, 'samples': 879936, 'steps': 4582, 'loss/train': 1.8866019248962402} +11/06/2021 21:54:08 - INFO - __main__ - Step 4584: {'lr': 0.0004996243128528628, 'samples': 880128, 'steps': 4583, 'loss/train': 2.051255464553833} +11/06/2021 21:54:08 - INFO - __main__ - Step 4585: {'lr': 0.0004996240219774025, 'samples': 880320, 'steps': 4584, 'loss/train': 1.9675004482269287} +11/06/2021 21:54:09 - INFO - __main__ - Step 4586: {'lr': 0.0004996237309894656, 'samples': 880512, 'steps': 4585, 'loss/train': 2.283939838409424} +11/06/2021 21:54:10 - INFO - __main__ - Step 4587: {'lr': 0.0004996234398890521, 'samples': 880704, 'steps': 4586, 'loss/train': 1.3432775735855103} +11/06/2021 21:54:10 - INFO - __main__ - Step 4588: {'lr': 0.000499623148676162, 'samples': 880896, 'steps': 4587, 'loss/train': 2.1022074222564697} +11/06/2021 21:54:10 - INFO - __main__ - Step 4589: {'lr': 0.0004996228573507957, 'samples': 881088, 'steps': 4588, 'loss/train': 2.6343271732330322} +11/06/2021 21:54:11 - INFO - __main__ - Step 4590: {'lr': 0.0004996225659129531, 'samples': 881280, 'steps': 4589, 'loss/train': 1.8193244934082031} +11/06/2021 21:54:11 - INFO - __main__ - Step 4591: {'lr': 0.0004996222743626345, 'samples': 881472, 'steps': 4590, 'loss/train': 2.7049386501312256} +11/06/2021 21:54:12 - INFO - __main__ - Step 4592: {'lr': 0.0004996219826998399, 'samples': 881664, 'steps': 4591, 'loss/train': 2.1974246501922607} +11/06/2021 21:54:13 - INFO - __main__ - Step 4593: {'lr': 0.0004996216909245695, 'samples': 881856, 'steps': 4592, 'loss/train': 2.143535852432251} +11/06/2021 21:54:13 - INFO - __main__ - Step 4594: {'lr': 0.0004996213990368234, 'samples': 882048, 'steps': 4593, 'loss/train': 2.2130115032196045} +11/06/2021 21:54:13 - INFO - __main__ - Step 4595: {'lr': 0.0004996211070366018, 'samples': 882240, 'steps': 4594, 'loss/train': 2.191429376602173} +11/06/2021 21:54:14 - INFO - __main__ - Step 4596: {'lr': 0.0004996208149239047, 'samples': 882432, 'steps': 4595, 'loss/train': 2.114386558532715} +11/06/2021 21:54:14 - INFO - __main__ - Step 4597: {'lr': 0.0004996205226987324, 'samples': 882624, 'steps': 4596, 'loss/train': 1.8462443351745605} +11/06/2021 21:54:15 - INFO - __main__ - Step 4598: {'lr': 0.0004996202303610849, 'samples': 882816, 'steps': 4597, 'loss/train': 1.8497729301452637} +11/06/2021 21:54:15 - INFO - __main__ - Step 4599: {'lr': 0.0004996199379109624, 'samples': 883008, 'steps': 4598, 'loss/train': 1.8294633626937866} +11/06/2021 21:54:16 - INFO - __main__ - Step 4600: {'lr': 0.000499619645348365, 'samples': 883200, 'steps': 4599, 'loss/train': 2.2398879528045654} +11/06/2021 21:54:16 - INFO - __main__ - Step 4601: {'lr': 0.0004996193526732929, 'samples': 883392, 'steps': 4600, 'loss/train': 2.352756977081299} +11/06/2021 21:54:16 - INFO - __main__ - Step 4602: {'lr': 0.0004996190598857461, 'samples': 883584, 'steps': 4601, 'loss/train': 1.9614698886871338} +11/06/2021 21:54:17 - INFO - __main__ - Step 4603: {'lr': 0.0004996187669857247, 'samples': 883776, 'steps': 4602, 'loss/train': 1.7905255556106567} +11/06/2021 21:54:18 - INFO - __main__ - Step 4604: {'lr': 0.0004996184739732291, 'samples': 883968, 'steps': 4603, 'loss/train': 2.1833322048187256} +11/06/2021 21:54:18 - INFO - __main__ - Step 4605: {'lr': 0.0004996181808482592, 'samples': 884160, 'steps': 4604, 'loss/train': 1.840651035308838} +11/06/2021 21:54:18 - INFO - __main__ - Step 4606: {'lr': 0.0004996178876108152, 'samples': 884352, 'steps': 4605, 'loss/train': 1.8321231603622437} +11/06/2021 21:54:19 - INFO - __main__ - Step 4607: {'lr': 0.0004996175942608973, 'samples': 884544, 'steps': 4606, 'loss/train': 2.244662284851074} +11/06/2021 21:54:20 - INFO - __main__ - Step 4608: {'lr': 0.0004996173007985055, 'samples': 884736, 'steps': 4607, 'loss/train': 1.933355689048767} +11/06/2021 21:54:20 - INFO - __main__ - Step 4609: {'lr': 0.00049961700722364, 'samples': 884928, 'steps': 4608, 'loss/train': 1.835882306098938} +11/06/2021 21:54:21 - INFO - __main__ - Step 4610: {'lr': 0.0004996167135363009, 'samples': 885120, 'steps': 4609, 'loss/train': 0.5920076966285706} +11/06/2021 21:54:21 - INFO - __main__ - Step 4611: {'lr': 0.0004996164197364884, 'samples': 885312, 'steps': 4610, 'loss/train': 2.2849209308624268} +11/06/2021 21:54:21 - INFO - __main__ - Step 4612: {'lr': 0.0004996161258242025, 'samples': 885504, 'steps': 4611, 'loss/train': 2.7224349975585938} +11/06/2021 21:54:22 - INFO - __main__ - Step 4613: {'lr': 0.0004996158317994436, 'samples': 885696, 'steps': 4612, 'loss/train': 2.293109893798828} +11/06/2021 21:54:23 - INFO - __main__ - Step 4614: {'lr': 0.0004996155376622115, 'samples': 885888, 'steps': 4613, 'loss/train': 2.077742099761963} +11/06/2021 21:54:23 - INFO - __main__ - Step 4615: {'lr': 0.0004996152434125066, 'samples': 886080, 'steps': 4614, 'loss/train': 2.129293441772461} +11/06/2021 21:54:23 - INFO - __main__ - Step 4616: {'lr': 0.0004996149490503289, 'samples': 886272, 'steps': 4615, 'loss/train': 1.7415257692337036} +11/06/2021 21:54:24 - INFO - __main__ - Step 4617: {'lr': 0.0004996146545756786, 'samples': 886464, 'steps': 4616, 'loss/train': 1.9531595706939697} +11/06/2021 21:54:25 - INFO - __main__ - Step 4618: {'lr': 0.0004996143599885557, 'samples': 886656, 'steps': 4617, 'loss/train': 2.034966468811035} +11/06/2021 21:54:25 - INFO - __main__ - Step 4619: {'lr': 0.0004996140652889603, 'samples': 886848, 'steps': 4618, 'loss/train': 1.855339765548706} +11/06/2021 21:54:25 - INFO - __main__ - Step 4620: {'lr': 0.0004996137704768929, 'samples': 887040, 'steps': 4619, 'loss/train': 2.010745048522949} +11/06/2021 21:54:26 - INFO - __main__ - Step 4621: {'lr': 0.0004996134755523532, 'samples': 887232, 'steps': 4620, 'loss/train': 1.572229027748108} +11/06/2021 21:54:26 - INFO - __main__ - Step 4622: {'lr': 0.0004996131805153417, 'samples': 887424, 'steps': 4621, 'loss/train': 2.434321880340576} +11/06/2021 21:54:27 - INFO - __main__ - Step 4623: {'lr': 0.0004996128853658583, 'samples': 887616, 'steps': 4622, 'loss/train': 1.803308129310608} +11/06/2021 21:54:27 - INFO - __main__ - Step 4624: {'lr': 0.0004996125901039031, 'samples': 887808, 'steps': 4623, 'loss/train': 2.078205108642578} +11/06/2021 21:54:28 - INFO - __main__ - Step 4625: {'lr': 0.0004996122947294764, 'samples': 888000, 'steps': 4624, 'loss/train': 1.3897693157196045} +11/06/2021 21:54:28 - INFO - __main__ - Step 4626: {'lr': 0.0004996119992425782, 'samples': 888192, 'steps': 4625, 'loss/train': 2.1612305641174316} +11/06/2021 21:54:28 - INFO - __main__ - Step 4627: {'lr': 0.0004996117036432087, 'samples': 888384, 'steps': 4626, 'loss/train': 1.204795479774475} +11/06/2021 21:54:29 - INFO - __main__ - Step 4628: {'lr': 0.000499611407931368, 'samples': 888576, 'steps': 4627, 'loss/train': 1.87538480758667} +11/06/2021 21:54:30 - INFO - __main__ - Step 4629: {'lr': 0.0004996111121070562, 'samples': 888768, 'steps': 4628, 'loss/train': 1.9798368215560913} +11/06/2021 21:54:30 - INFO - __main__ - Step 4630: {'lr': 0.0004996108161702736, 'samples': 888960, 'steps': 4629, 'loss/train': 1.8879029750823975} +11/06/2021 21:54:30 - INFO - __main__ - Step 4631: {'lr': 0.0004996105201210202, 'samples': 889152, 'steps': 4630, 'loss/train': 1.498540997505188} +11/06/2021 21:54:31 - INFO - __main__ - Step 4632: {'lr': 0.0004996102239592961, 'samples': 889344, 'steps': 4631, 'loss/train': 2.450267791748047} +11/06/2021 21:54:31 - INFO - __main__ - Step 4633: {'lr': 0.0004996099276851015, 'samples': 889536, 'steps': 4632, 'loss/train': 1.960253357887268} +11/06/2021 21:54:32 - INFO - __main__ - Step 4634: {'lr': 0.0004996096312984365, 'samples': 889728, 'steps': 4633, 'loss/train': 2.13409423828125} +11/06/2021 21:54:33 - INFO - __main__ - Step 4635: {'lr': 0.0004996093347993013, 'samples': 889920, 'steps': 4634, 'loss/train': 2.0862467288970947} +11/06/2021 21:54:33 - INFO - __main__ - Step 4636: {'lr': 0.000499609038187696, 'samples': 890112, 'steps': 4635, 'loss/train': 1.7066518068313599} +11/06/2021 21:54:33 - INFO - __main__ - Step 4637: {'lr': 0.0004996087414636207, 'samples': 890304, 'steps': 4636, 'loss/train': 1.917240858078003} +11/06/2021 21:54:34 - INFO - __main__ - Step 4638: {'lr': 0.0004996084446270755, 'samples': 890496, 'steps': 4637, 'loss/train': 1.5188076496124268} +11/06/2021 21:54:35 - INFO - __main__ - Step 4639: {'lr': 0.0004996081476780607, 'samples': 890688, 'steps': 4638, 'loss/train': 2.3080358505249023} +11/06/2021 21:54:35 - INFO - __main__ - Step 4640: {'lr': 0.0004996078506165762, 'samples': 890880, 'steps': 4639, 'loss/train': 1.5977153778076172} +11/06/2021 21:54:35 - INFO - __main__ - Step 4641: {'lr': 0.0004996075534426222, 'samples': 891072, 'steps': 4640, 'loss/train': 1.9571729898452759} +11/06/2021 21:54:36 - INFO - __main__ - Step 4642: {'lr': 0.000499607256156199, 'samples': 891264, 'steps': 4641, 'loss/train': 1.8053956031799316} +11/06/2021 21:54:36 - INFO - __main__ - Step 4643: {'lr': 0.0004996069587573067, 'samples': 891456, 'steps': 4642, 'loss/train': 1.5705664157867432} +11/06/2021 21:54:37 - INFO - __main__ - Step 4644: {'lr': 0.0004996066612459452, 'samples': 891648, 'steps': 4643, 'loss/train': 1.735826849937439} +11/06/2021 21:54:37 - INFO - __main__ - Step 4645: {'lr': 0.0004996063636221148, 'samples': 891840, 'steps': 4644, 'loss/train': 2.2214009761810303} +11/06/2021 21:54:38 - INFO - __main__ - Step 4646: {'lr': 0.0004996060658858158, 'samples': 892032, 'steps': 4645, 'loss/train': 2.121854305267334} +11/06/2021 21:54:38 - INFO - __main__ - Step 4647: {'lr': 0.000499605768037048, 'samples': 892224, 'steps': 4646, 'loss/train': 2.353457450866699} +11/06/2021 21:54:39 - INFO - __main__ - Step 4648: {'lr': 0.0004996054700758117, 'samples': 892416, 'steps': 4647, 'loss/train': 2.0667355060577393} +11/06/2021 21:54:40 - INFO - __main__ - Step 4649: {'lr': 0.0004996051720021071, 'samples': 892608, 'steps': 4648, 'loss/train': 2.009962558746338} +11/06/2021 21:54:40 - INFO - __main__ - Step 4650: {'lr': 0.0004996048738159342, 'samples': 892800, 'steps': 4649, 'loss/train': 0.5192378163337708} +11/06/2021 21:54:40 - INFO - __main__ - Step 4651: {'lr': 0.0004996045755172932, 'samples': 892992, 'steps': 4650, 'loss/train': 1.84172785282135} +11/06/2021 21:54:41 - INFO - __main__ - Step 4652: {'lr': 0.0004996042771061843, 'samples': 893184, 'steps': 4651, 'loss/train': 2.217998504638672} +11/06/2021 21:54:41 - INFO - __main__ - Step 4653: {'lr': 0.0004996039785826075, 'samples': 893376, 'steps': 4652, 'loss/train': 1.648202657699585} +11/06/2021 21:54:42 - INFO - __main__ - Step 4654: {'lr': 0.000499603679946563, 'samples': 893568, 'steps': 4653, 'loss/train': 2.03910756111145} +11/06/2021 21:54:43 - INFO - __main__ - Step 4655: {'lr': 0.0004996033811980509, 'samples': 893760, 'steps': 4654, 'loss/train': 1.7975298166275024} +11/06/2021 21:54:43 - INFO - __main__ - Step 4656: {'lr': 0.0004996030823370715, 'samples': 893952, 'steps': 4655, 'loss/train': 1.8534296751022339} +11/06/2021 21:54:43 - INFO - __main__ - Step 4657: {'lr': 0.0004996027833636247, 'samples': 894144, 'steps': 4656, 'loss/train': 2.475618600845337} +11/06/2021 21:54:44 - INFO - __main__ - Step 4658: {'lr': 0.0004996024842777106, 'samples': 894336, 'steps': 4657, 'loss/train': 1.9979157447814941} +11/06/2021 21:54:44 - INFO - __main__ - Step 4659: {'lr': 0.0004996021850793297, 'samples': 894528, 'steps': 4658, 'loss/train': 2.030845880508423} +11/06/2021 21:54:45 - INFO - __main__ - Step 4660: {'lr': 0.0004996018857684818, 'samples': 894720, 'steps': 4659, 'loss/train': 2.158336877822876} +11/06/2021 21:54:45 - INFO - __main__ - Step 4661: {'lr': 0.0004996015863451672, 'samples': 894912, 'steps': 4660, 'loss/train': 1.8965908288955688} +11/06/2021 21:54:46 - INFO - __main__ - Step 4662: {'lr': 0.0004996012868093859, 'samples': 895104, 'steps': 4661, 'loss/train': 2.2160189151763916} +11/06/2021 21:54:46 - INFO - __main__ - Step 4663: {'lr': 0.0004996009871611382, 'samples': 895296, 'steps': 4662, 'loss/train': 2.1121556758880615} +11/06/2021 21:54:46 - INFO - __main__ - Step 4664: {'lr': 0.0004996006874004241, 'samples': 895488, 'steps': 4663, 'loss/train': 1.954535961151123} +11/06/2021 21:54:49 - INFO - __main__ - Step 4665: {'lr': 0.0004996003875272438, 'samples': 895680, 'steps': 4664, 'loss/train': 1.9362295866012573} +11/06/2021 21:54:49 - INFO - __main__ - Step 4666: {'lr': 0.0004996000875415973, 'samples': 895872, 'steps': 4665, 'loss/train': 1.841673731803894} +11/06/2021 21:54:50 - INFO - __main__ - Step 4667: {'lr': 0.000499599787443485, 'samples': 896064, 'steps': 4666, 'loss/train': 1.7296624183654785} +11/06/2021 21:54:50 - INFO - __main__ - Step 4668: {'lr': 0.0004995994872329069, 'samples': 896256, 'steps': 4667, 'loss/train': 2.1744236946105957} +11/06/2021 21:54:50 - INFO - __main__ - Step 4669: {'lr': 0.000499599186909863, 'samples': 896448, 'steps': 4668, 'loss/train': 2.424499273300171} +11/06/2021 21:54:51 - INFO - __main__ - Step 4670: {'lr': 0.0004995988864743536, 'samples': 896640, 'steps': 4669, 'loss/train': 2.350759744644165} +11/06/2021 21:54:51 - INFO - __main__ - Step 4671: {'lr': 0.0004995985859263789, 'samples': 896832, 'steps': 4670, 'loss/train': 1.975557804107666} +11/06/2021 21:54:51 - INFO - __main__ - Step 4672: {'lr': 0.0004995982852659388, 'samples': 897024, 'steps': 4671, 'loss/train': 2.1741600036621094} +11/06/2021 21:54:52 - INFO - __main__ - Step 4673: {'lr': 0.0004995979844930336, 'samples': 897216, 'steps': 4672, 'loss/train': 2.133139133453369} +11/06/2021 21:54:53 - INFO - __main__ - Step 4674: {'lr': 0.0004995976836076635, 'samples': 897408, 'steps': 4673, 'loss/train': 2.012343168258667} +11/06/2021 21:54:53 - INFO - __main__ - Step 4675: {'lr': 0.0004995973826098283, 'samples': 897600, 'steps': 4674, 'loss/train': 1.9310002326965332} +11/06/2021 21:54:53 - INFO - __main__ - Step 4676: {'lr': 0.0004995970814995285, 'samples': 897792, 'steps': 4675, 'loss/train': 1.969705581665039} +11/06/2021 21:54:54 - INFO - __main__ - Step 4677: {'lr': 0.0004995967802767641, 'samples': 897984, 'steps': 4676, 'loss/train': 0.5457145571708679} +11/06/2021 21:54:55 - INFO - __main__ - Step 4678: {'lr': 0.0004995964789415353, 'samples': 898176, 'steps': 4677, 'loss/train': 2.1169257164001465} +11/06/2021 21:54:55 - INFO - __main__ - Step 4679: {'lr': 0.0004995961774938423, 'samples': 898368, 'steps': 4678, 'loss/train': 2.047304630279541} +11/06/2021 21:54:56 - INFO - __main__ - Step 4680: {'lr': 0.0004995958759336849, 'samples': 898560, 'steps': 4679, 'loss/train': 2.2334115505218506} +11/06/2021 21:54:56 - INFO - __main__ - Step 4681: {'lr': 0.0004995955742610635, 'samples': 898752, 'steps': 4680, 'loss/train': 1.9930462837219238} +11/06/2021 21:54:56 - INFO - __main__ - Step 4682: {'lr': 0.0004995952724759781, 'samples': 898944, 'steps': 4681, 'loss/train': 2.6837527751922607} +11/06/2021 21:54:57 - INFO - __main__ - Step 4683: {'lr': 0.0004995949705784291, 'samples': 899136, 'steps': 4682, 'loss/train': 2.2613110542297363} +11/06/2021 21:54:58 - INFO - __main__ - Step 4684: {'lr': 0.0004995946685684164, 'samples': 899328, 'steps': 4683, 'loss/train': 1.6057881116867065} +11/06/2021 21:54:58 - INFO - __main__ - Step 4685: {'lr': 0.0004995943664459401, 'samples': 899520, 'steps': 4684, 'loss/train': 4.826809406280518} +11/06/2021 21:54:58 - INFO - __main__ - Step 4686: {'lr': 0.0004995940642110005, 'samples': 899712, 'steps': 4685, 'loss/train': 2.056427478790283} +11/06/2021 21:54:59 - INFO - __main__ - Step 4687: {'lr': 0.0004995937618635977, 'samples': 899904, 'steps': 4686, 'loss/train': 2.5549728870391846} +11/06/2021 21:55:00 - INFO - __main__ - Step 4688: {'lr': 0.0004995934594037316, 'samples': 900096, 'steps': 4687, 'loss/train': 1.6349835395812988} +11/06/2021 21:55:00 - INFO - __main__ - Step 4689: {'lr': 0.0004995931568314028, 'samples': 900288, 'steps': 4688, 'loss/train': 2.1520705223083496} +11/06/2021 21:55:00 - INFO - __main__ - Step 4690: {'lr': 0.0004995928541466111, 'samples': 900480, 'steps': 4689, 'loss/train': 2.086479902267456} +11/06/2021 21:55:01 - INFO - __main__ - Step 4691: {'lr': 0.0004995925513493567, 'samples': 900672, 'steps': 4690, 'loss/train': 2.070526123046875} +11/06/2021 21:55:01 - INFO - __main__ - Step 4692: {'lr': 0.0004995922484396397, 'samples': 900864, 'steps': 4691, 'loss/train': 1.8946828842163086} +11/06/2021 21:55:01 - INFO - __main__ - Step 4693: {'lr': 0.0004995919454174603, 'samples': 901056, 'steps': 4692, 'loss/train': 2.0533816814422607} +11/06/2021 21:55:02 - INFO - __main__ - Step 4694: {'lr': 0.0004995916422828187, 'samples': 901248, 'steps': 4693, 'loss/train': 1.6909483671188354} +11/06/2021 21:55:03 - INFO - __main__ - Step 4695: {'lr': 0.0004995913390357148, 'samples': 901440, 'steps': 4694, 'loss/train': 2.1296300888061523} +11/06/2021 21:55:03 - INFO - __main__ - Step 4696: {'lr': 0.0004995910356761491, 'samples': 901632, 'steps': 4695, 'loss/train': 1.5140820741653442} +11/06/2021 21:55:03 - INFO - __main__ - Step 4697: {'lr': 0.0004995907322041214, 'samples': 901824, 'steps': 4696, 'loss/train': 2.322920560836792} +11/06/2021 21:55:04 - INFO - __main__ - Step 4698: {'lr': 0.000499590428619632, 'samples': 902016, 'steps': 4697, 'loss/train': 1.875250220298767} +11/06/2021 21:55:05 - INFO - __main__ - Step 4699: {'lr': 0.000499590124922681, 'samples': 902208, 'steps': 4698, 'loss/train': 0.6247835159301758} +11/06/2021 21:55:05 - INFO - __main__ - Step 4700: {'lr': 0.0004995898211132685, 'samples': 902400, 'steps': 4699, 'loss/train': 2.233553171157837} +11/06/2021 21:55:06 - INFO - __main__ - Step 4701: {'lr': 0.0004995895171913947, 'samples': 902592, 'steps': 4700, 'loss/train': 2.2635233402252197} +11/06/2021 21:55:06 - INFO - __main__ - Step 4702: {'lr': 0.0004995892131570598, 'samples': 902784, 'steps': 4701, 'loss/train': 1.2235736846923828} +11/06/2021 21:55:06 - INFO - __main__ - Step 4703: {'lr': 0.0004995889090102638, 'samples': 902976, 'steps': 4702, 'loss/train': 1.9816572666168213} +11/06/2021 21:55:07 - INFO - __main__ - Step 4704: {'lr': 0.0004995886047510068, 'samples': 903168, 'steps': 4703, 'loss/train': 2.1657280921936035} +11/06/2021 21:55:08 - INFO - __main__ - Step 4705: {'lr': 0.0004995883003792891, 'samples': 903360, 'steps': 4704, 'loss/train': 2.1573469638824463} +11/06/2021 21:55:08 - INFO - __main__ - Step 4706: {'lr': 0.0004995879958951107, 'samples': 903552, 'steps': 4705, 'loss/train': 1.8357532024383545} +11/06/2021 21:55:08 - INFO - __main__ - Step 4707: {'lr': 0.0004995876912984719, 'samples': 903744, 'steps': 4706, 'loss/train': 2.194171667098999} +11/06/2021 21:55:09 - INFO - __main__ - Step 4708: {'lr': 0.0004995873865893727, 'samples': 903936, 'steps': 4707, 'loss/train': 2.122776985168457} +11/06/2021 21:55:10 - INFO - __main__ - Step 4709: {'lr': 0.0004995870817678133, 'samples': 904128, 'steps': 4708, 'loss/train': 1.9645999670028687} +11/06/2021 21:55:10 - INFO - __main__ - Step 4710: {'lr': 0.0004995867768337938, 'samples': 904320, 'steps': 4709, 'loss/train': 2.073693037033081} +11/06/2021 21:55:10 - INFO - __main__ - Step 4711: {'lr': 0.0004995864717873143, 'samples': 904512, 'steps': 4710, 'loss/train': 1.3138636350631714} +11/06/2021 21:55:11 - INFO - __main__ - Step 4712: {'lr': 0.000499586166628375, 'samples': 904704, 'steps': 4711, 'loss/train': 2.1905508041381836} +11/06/2021 21:55:11 - INFO - __main__ - Step 4713: {'lr': 0.0004995858613569761, 'samples': 904896, 'steps': 4712, 'loss/train': 2.189453363418579} +11/06/2021 21:55:12 - INFO - __main__ - Step 4714: {'lr': 0.0004995855559731176, 'samples': 905088, 'steps': 4713, 'loss/train': 2.266838550567627} +11/06/2021 21:55:12 - INFO - __main__ - Step 4715: {'lr': 0.0004995852504767997, 'samples': 905280, 'steps': 4714, 'loss/train': 2.4359450340270996} +11/06/2021 21:55:13 - INFO - __main__ - Step 4716: {'lr': 0.0004995849448680225, 'samples': 905472, 'steps': 4715, 'loss/train': 2.0849661827087402} +11/06/2021 21:55:13 - INFO - __main__ - Step 4717: {'lr': 0.0004995846391467862, 'samples': 905664, 'steps': 4716, 'loss/train': 2.252028465270996} +11/06/2021 21:55:13 - INFO - __main__ - Step 4718: {'lr': 0.000499584333313091, 'samples': 905856, 'steps': 4717, 'loss/train': 1.7350718975067139} +11/06/2021 21:55:14 - INFO - __main__ - Step 4719: {'lr': 0.0004995840273669369, 'samples': 906048, 'steps': 4718, 'loss/train': 2.1980574131011963} +11/06/2021 21:55:15 - INFO - __main__ - Step 4720: {'lr': 0.0004995837213083241, 'samples': 906240, 'steps': 4719, 'loss/train': 2.655808925628662} +11/06/2021 21:55:15 - INFO - __main__ - Step 4721: {'lr': 0.0004995834151372526, 'samples': 906432, 'steps': 4720, 'loss/train': 1.8203097581863403} +11/06/2021 21:55:16 - INFO - __main__ - Step 4722: {'lr': 0.0004995831088537229, 'samples': 906624, 'steps': 4721, 'loss/train': 1.9288336038589478} +11/06/2021 21:55:16 - INFO - __main__ - Step 4723: {'lr': 0.0004995828024577346, 'samples': 906816, 'steps': 4722, 'loss/train': 2.221000909805298} +11/06/2021 21:55:16 - INFO - __main__ - Step 4724: {'lr': 0.0004995824959492884, 'samples': 907008, 'steps': 4723, 'loss/train': 2.1988742351531982} +11/06/2021 21:55:17 - INFO - __main__ - Step 4725: {'lr': 0.0004995821893283841, 'samples': 907200, 'steps': 4724, 'loss/train': 1.5321357250213623} +11/06/2021 21:55:18 - INFO - __main__ - Step 4726: {'lr': 0.0004995818825950218, 'samples': 907392, 'steps': 4725, 'loss/train': 2.327254295349121} +11/06/2021 21:55:18 - INFO - __main__ - Step 4727: {'lr': 0.0004995815757492019, 'samples': 907584, 'steps': 4726, 'loss/train': 1.697227954864502} +11/06/2021 21:55:18 - INFO - __main__ - Step 4728: {'lr': 0.0004995812687909243, 'samples': 907776, 'steps': 4727, 'loss/train': 1.925517201423645} +11/06/2021 21:55:19 - INFO - __main__ - Step 4729: {'lr': 0.0004995809617201894, 'samples': 907968, 'steps': 4728, 'loss/train': 2.1235063076019287} +11/06/2021 21:55:20 - INFO - __main__ - Step 4730: {'lr': 0.000499580654536997, 'samples': 908160, 'steps': 4729, 'loss/train': 1.6067290306091309} +11/06/2021 21:55:20 - INFO - __main__ - Step 4731: {'lr': 0.0004995803472413474, 'samples': 908352, 'steps': 4730, 'loss/train': 2.062716245651245} +11/06/2021 21:55:21 - INFO - __main__ - Step 4732: {'lr': 0.0004995800398332409, 'samples': 908544, 'steps': 4731, 'loss/train': 2.0088040828704834} +11/06/2021 21:55:21 - INFO - __main__ - Step 4733: {'lr': 0.0004995797323126774, 'samples': 908736, 'steps': 4732, 'loss/train': 2.1273770332336426} +11/06/2021 21:55:21 - INFO - __main__ - Step 4734: {'lr': 0.0004995794246796571, 'samples': 908928, 'steps': 4733, 'loss/train': 1.9056154489517212} +11/06/2021 21:55:22 - INFO - __main__ - Step 4735: {'lr': 0.0004995791169341801, 'samples': 909120, 'steps': 4734, 'loss/train': 1.6100257635116577} +11/06/2021 21:55:23 - INFO - __main__ - Step 4736: {'lr': 0.0004995788090762467, 'samples': 909312, 'steps': 4735, 'loss/train': 1.8864790201187134} +11/06/2021 21:55:23 - INFO - __main__ - Step 4737: {'lr': 0.000499578501105857, 'samples': 909504, 'steps': 4736, 'loss/train': 1.9987335205078125} +11/06/2021 21:55:23 - INFO - __main__ - Step 4738: {'lr': 0.000499578193023011, 'samples': 909696, 'steps': 4737, 'loss/train': 2.262216567993164} +11/06/2021 21:55:24 - INFO - __main__ - Step 4739: {'lr': 0.0004995778848277088, 'samples': 909888, 'steps': 4738, 'loss/train': 1.9893282651901245} +11/06/2021 21:55:24 - INFO - __main__ - Step 4740: {'lr': 0.0004995775765199509, 'samples': 910080, 'steps': 4739, 'loss/train': 2.1088781356811523} +11/06/2021 21:55:25 - INFO - __main__ - Step 4741: {'lr': 0.000499577268099737, 'samples': 910272, 'steps': 4740, 'loss/train': 1.7496652603149414} +11/06/2021 21:55:25 - INFO - __main__ - Step 4742: {'lr': 0.0004995769595670675, 'samples': 910464, 'steps': 4741, 'loss/train': 1.8243907690048218} +11/06/2021 21:55:26 - INFO - __main__ - Step 4743: {'lr': 0.0004995766509219425, 'samples': 910656, 'steps': 4742, 'loss/train': 1.8536678552627563} +11/06/2021 21:55:26 - INFO - __main__ - Step 4744: {'lr': 0.0004995763421643621, 'samples': 910848, 'steps': 4743, 'loss/train': 2.054396152496338} +11/06/2021 21:55:26 - INFO - __main__ - Step 4745: {'lr': 0.0004995760332943264, 'samples': 911040, 'steps': 4744, 'loss/train': 2.0926995277404785} +11/06/2021 21:55:28 - INFO - __main__ - Step 4746: {'lr': 0.0004995757243118356, 'samples': 911232, 'steps': 4745, 'loss/train': 2.342751979827881} +11/06/2021 21:55:28 - INFO - __main__ - Step 4747: {'lr': 0.0004995754152168899, 'samples': 911424, 'steps': 4746, 'loss/train': 1.4246360063552856} +11/06/2021 21:55:28 - INFO - __main__ - Step 4748: {'lr': 0.0004995751060094893, 'samples': 911616, 'steps': 4747, 'loss/train': 1.6921579837799072} +11/06/2021 21:55:29 - INFO - __main__ - Step 4749: {'lr': 0.000499574796689634, 'samples': 911808, 'steps': 4748, 'loss/train': 1.5545167922973633} +11/06/2021 21:55:29 - INFO - __main__ - Step 4750: {'lr': 0.0004995744872573242, 'samples': 912000, 'steps': 4749, 'loss/train': 1.6792792081832886} +11/06/2021 21:55:30 - INFO - __main__ - Step 4751: {'lr': 0.00049957417771256, 'samples': 912192, 'steps': 4750, 'loss/train': 2.301424741744995} +11/06/2021 21:55:31 - INFO - __main__ - Step 4752: {'lr': 0.0004995738680553415, 'samples': 912384, 'steps': 4751, 'loss/train': 2.0780701637268066} +11/06/2021 21:55:31 - INFO - __main__ - Step 4753: {'lr': 0.0004995735582856689, 'samples': 912576, 'steps': 4752, 'loss/train': 2.5025558471679688} +11/06/2021 21:55:31 - INFO - __main__ - Step 4754: {'lr': 0.0004995732484035422, 'samples': 912768, 'steps': 4753, 'loss/train': 1.6821069717407227} +11/06/2021 21:55:32 - INFO - __main__ - Step 4755: {'lr': 0.0004995729384089618, 'samples': 912960, 'steps': 4754, 'loss/train': 1.8580917119979858} +11/06/2021 21:55:32 - INFO - __main__ - Step 4756: {'lr': 0.0004995726283019275, 'samples': 913152, 'steps': 4755, 'loss/train': 5.469394207000732} +11/06/2021 21:55:33 - INFO - __main__ - Step 4757: {'lr': 0.0004995723180824397, 'samples': 913344, 'steps': 4756, 'loss/train': 2.1818153858184814} +11/06/2021 21:55:33 - INFO - __main__ - Step 4758: {'lr': 0.0004995720077504986, 'samples': 913536, 'steps': 4757, 'loss/train': 1.8625547885894775} +11/06/2021 21:55:34 - INFO - __main__ - Step 4759: {'lr': 0.0004995716973061041, 'samples': 913728, 'steps': 4758, 'loss/train': 2.1026546955108643} +11/06/2021 21:55:34 - INFO - __main__ - Step 4760: {'lr': 0.0004995713867492564, 'samples': 913920, 'steps': 4759, 'loss/train': 2.178823471069336} +11/06/2021 21:55:34 - INFO - __main__ - Step 4761: {'lr': 0.0004995710760799557, 'samples': 914112, 'steps': 4760, 'loss/train': 1.872559905052185} +11/06/2021 21:55:36 - INFO - __main__ - Step 4762: {'lr': 0.0004995707652982022, 'samples': 914304, 'steps': 4761, 'loss/train': 1.871140718460083} +11/06/2021 21:55:36 - INFO - __main__ - Step 4763: {'lr': 0.0004995704544039958, 'samples': 914496, 'steps': 4762, 'loss/train': 2.3007659912109375} +11/06/2021 21:55:36 - INFO - __main__ - Step 4764: {'lr': 0.0004995701433973369, 'samples': 914688, 'steps': 4763, 'loss/train': 0.6473186016082764} +11/06/2021 21:55:37 - INFO - __main__ - Step 4765: {'lr': 0.0004995698322782257, 'samples': 914880, 'steps': 4764, 'loss/train': 1.983769416809082} +11/06/2021 21:55:37 - INFO - __main__ - Step 4766: {'lr': 0.0004995695210466619, 'samples': 915072, 'steps': 4765, 'loss/train': 1.983061671257019} +11/06/2021 21:55:37 - INFO - __main__ - Step 4767: {'lr': 0.0004995692097026461, 'samples': 915264, 'steps': 4766, 'loss/train': 1.7104268074035645} +11/06/2021 21:55:38 - INFO - __main__ - Step 4768: {'lr': 0.0004995688982461783, 'samples': 915456, 'steps': 4767, 'loss/train': 2.606029748916626} +11/06/2021 21:55:39 - INFO - __main__ - Step 4769: {'lr': 0.0004995685866772586, 'samples': 915648, 'steps': 4768, 'loss/train': 1.642903447151184} +11/06/2021 21:55:39 - INFO - __main__ - Step 4770: {'lr': 0.000499568274995887, 'samples': 915840, 'steps': 4769, 'loss/train': 2.383634328842163} +11/06/2021 21:55:39 - INFO - __main__ - Step 4771: {'lr': 0.0004995679632020639, 'samples': 916032, 'steps': 4770, 'loss/train': 2.0660829544067383} +11/06/2021 21:55:40 - INFO - __main__ - Step 4772: {'lr': 0.0004995676512957892, 'samples': 916224, 'steps': 4771, 'loss/train': 2.0167953968048096} +11/06/2021 21:55:41 - INFO - __main__ - Step 4773: {'lr': 0.0004995673392770634, 'samples': 916416, 'steps': 4772, 'loss/train': 2.2633042335510254} +11/06/2021 21:55:41 - INFO - __main__ - Step 4774: {'lr': 0.0004995670271458863, 'samples': 916608, 'steps': 4773, 'loss/train': 2.0929172039031982} +11/06/2021 21:55:42 - INFO - __main__ - Step 4775: {'lr': 0.0004995667149022581, 'samples': 916800, 'steps': 4774, 'loss/train': 2.1483800411224365} +11/06/2021 21:55:42 - INFO - __main__ - Step 4776: {'lr': 0.000499566402546179, 'samples': 916992, 'steps': 4775, 'loss/train': 1.7766259908676147} +11/06/2021 21:55:42 - INFO - __main__ - Step 4777: {'lr': 0.0004995660900776491, 'samples': 917184, 'steps': 4776, 'loss/train': 1.8469535112380981} +11/06/2021 21:55:43 - INFO - __main__ - Step 4778: {'lr': 0.0004995657774966686, 'samples': 917376, 'steps': 4777, 'loss/train': 2.0229592323303223} +11/06/2021 21:55:44 - INFO - __main__ - Step 4779: {'lr': 0.0004995654648032377, 'samples': 917568, 'steps': 4778, 'loss/train': 1.3622205257415771} +11/06/2021 21:55:44 - INFO - __main__ - Step 4780: {'lr': 0.0004995651519973563, 'samples': 917760, 'steps': 4779, 'loss/train': 2.1144587993621826} +11/06/2021 21:55:44 - INFO - __main__ - Step 4781: {'lr': 0.0004995648390790249, 'samples': 917952, 'steps': 4780, 'loss/train': 1.954245686531067} +11/06/2021 21:55:45 - INFO - __main__ - Step 4782: {'lr': 0.0004995645260482432, 'samples': 918144, 'steps': 4781, 'loss/train': 2.7569739818573} +11/06/2021 21:55:46 - INFO - __main__ - Step 4783: {'lr': 0.0004995642129050117, 'samples': 918336, 'steps': 4782, 'loss/train': 1.3092371225357056} +11/06/2021 21:55:46 - INFO - __main__ - Step 4784: {'lr': 0.0004995638996493304, 'samples': 918528, 'steps': 4783, 'loss/train': 1.6529567241668701} +11/06/2021 21:55:46 - INFO - __main__ - Step 4785: {'lr': 0.0004995635862811994, 'samples': 918720, 'steps': 4784, 'loss/train': 2.129288911819458} +11/06/2021 21:55:47 - INFO - __main__ - Step 4786: {'lr': 0.000499563272800619, 'samples': 918912, 'steps': 4785, 'loss/train': 2.2793755531311035} +11/06/2021 21:55:47 - INFO - __main__ - Step 4787: {'lr': 0.0004995629592075892, 'samples': 919104, 'steps': 4786, 'loss/train': 2.265683174133301} +11/06/2021 21:55:48 - INFO - __main__ - Step 4788: {'lr': 0.0004995626455021101, 'samples': 919296, 'steps': 4787, 'loss/train': 2.4997894763946533} +11/06/2021 21:55:49 - INFO - __main__ - Step 4789: {'lr': 0.0004995623316841821, 'samples': 919488, 'steps': 4788, 'loss/train': 2.061391592025757} +11/06/2021 21:55:49 - INFO - __main__ - Step 4790: {'lr': 0.0004995620177538051, 'samples': 919680, 'steps': 4789, 'loss/train': 2.428020715713501} +11/06/2021 21:55:50 - INFO - __main__ - Step 4791: {'lr': 0.0004995617037109792, 'samples': 919872, 'steps': 4790, 'loss/train': 1.7995200157165527} +11/06/2021 21:55:50 - INFO - __main__ - Step 4792: {'lr': 0.0004995613895557048, 'samples': 920064, 'steps': 4791, 'loss/train': 1.883157730102539} +11/06/2021 21:55:51 - INFO - __main__ - Step 4793: {'lr': 0.0004995610752879818, 'samples': 920256, 'steps': 4792, 'loss/train': 2.25808048248291} +11/06/2021 21:55:51 - INFO - __main__ - Step 4794: {'lr': 0.0004995607609078104, 'samples': 920448, 'steps': 4793, 'loss/train': 2.118656873703003} +11/06/2021 21:55:52 - INFO - __main__ - Step 4795: {'lr': 0.0004995604464151908, 'samples': 920640, 'steps': 4794, 'loss/train': 2.104627847671509} +11/06/2021 21:55:52 - INFO - __main__ - Step 4796: {'lr': 0.0004995601318101231, 'samples': 920832, 'steps': 4795, 'loss/train': 2.0214784145355225} +11/06/2021 21:55:52 - INFO - __main__ - Step 4797: {'lr': 0.0004995598170926074, 'samples': 921024, 'steps': 4796, 'loss/train': 1.9268819093704224} +11/06/2021 21:55:53 - INFO - __main__ - Step 4798: {'lr': 0.000499559502262644, 'samples': 921216, 'steps': 4797, 'loss/train': 1.5341185331344604} +11/06/2021 21:55:54 - INFO - __main__ - Step 4799: {'lr': 0.000499559187320233, 'samples': 921408, 'steps': 4798, 'loss/train': 2.1940500736236572} +11/06/2021 21:55:54 - INFO - __main__ - Step 4800: {'lr': 0.0004995588722653743, 'samples': 921600, 'steps': 4799, 'loss/train': 1.9055429697036743} +11/06/2021 21:55:54 - INFO - __main__ - Step 4801: {'lr': 0.0004995585570980684, 'samples': 921792, 'steps': 4800, 'loss/train': 2.3950815200805664} +11/06/2021 21:55:55 - INFO - __main__ - Step 4802: {'lr': 0.0004995582418183151, 'samples': 921984, 'steps': 4801, 'loss/train': 1.969565510749817} +11/06/2021 21:55:55 - INFO - __main__ - Step 4803: {'lr': 0.0004995579264261148, 'samples': 922176, 'steps': 4802, 'loss/train': 1.7654180526733398} +11/06/2021 21:55:56 - INFO - __main__ - Step 4804: {'lr': 0.0004995576109214676, 'samples': 922368, 'steps': 4803, 'loss/train': 2.6347360610961914} +11/06/2021 21:55:57 - INFO - __main__ - Step 4805: {'lr': 0.0004995572953043736, 'samples': 922560, 'steps': 4804, 'loss/train': 1.7408865690231323} +11/06/2021 21:55:57 - INFO - __main__ - Step 4806: {'lr': 0.0004995569795748328, 'samples': 922752, 'steps': 4805, 'loss/train': 1.1435315608978271} +11/06/2021 21:55:57 - INFO - __main__ - Step 4807: {'lr': 0.0004995566637328456, 'samples': 922944, 'steps': 4806, 'loss/train': 1.0032495260238647} +11/06/2021 21:55:58 - INFO - __main__ - Step 4808: {'lr': 0.0004995563477784119, 'samples': 923136, 'steps': 4807, 'loss/train': 2.07177472114563} +11/06/2021 21:55:59 - INFO - __main__ - Step 4809: {'lr': 0.000499556031711532, 'samples': 923328, 'steps': 4808, 'loss/train': 2.4952619075775146} +11/06/2021 21:55:59 - INFO - __main__ - Step 4810: {'lr': 0.000499555715532206, 'samples': 923520, 'steps': 4809, 'loss/train': 1.7936309576034546} +11/06/2021 21:55:59 - INFO - __main__ - Step 4811: {'lr': 0.0004995553992404342, 'samples': 923712, 'steps': 4810, 'loss/train': 1.8712501525878906} +11/06/2021 21:56:00 - INFO - __main__ - Step 4812: {'lr': 0.0004995550828362163, 'samples': 923904, 'steps': 4811, 'loss/train': 2.1187033653259277} +11/06/2021 21:56:00 - INFO - __main__ - Step 4813: {'lr': 0.000499554766319553, 'samples': 924096, 'steps': 4812, 'loss/train': 1.8378645181655884} +11/06/2021 21:56:01 - INFO - __main__ - Step 4814: {'lr': 0.0004995544496904441, 'samples': 924288, 'steps': 4813, 'loss/train': 2.4952051639556885} +11/06/2021 21:56:01 - INFO - __main__ - Step 4815: {'lr': 0.0004995541329488897, 'samples': 924480, 'steps': 4814, 'loss/train': 1.766731858253479} +11/06/2021 21:56:02 - INFO - __main__ - Step 4816: {'lr': 0.0004995538160948901, 'samples': 924672, 'steps': 4815, 'loss/train': 1.933300495147705} +11/06/2021 21:56:02 - INFO - __main__ - Step 4817: {'lr': 0.0004995534991284455, 'samples': 924864, 'steps': 4816, 'loss/train': 1.8735243082046509} +11/06/2021 21:56:02 - INFO - __main__ - Step 4818: {'lr': 0.0004995531820495559, 'samples': 925056, 'steps': 4817, 'loss/train': 2.582186460494995} +11/06/2021 21:56:03 - INFO - __main__ - Step 4819: {'lr': 0.0004995528648582214, 'samples': 925248, 'steps': 4818, 'loss/train': 2.391286611557007} +11/06/2021 21:56:04 - INFO - __main__ - Step 4820: {'lr': 0.0004995525475544423, 'samples': 925440, 'steps': 4819, 'loss/train': 2.931082248687744} +11/06/2021 21:56:04 - INFO - __main__ - Step 4821: {'lr': 0.0004995522301382187, 'samples': 925632, 'steps': 4820, 'loss/train': 1.65629243850708} +11/06/2021 21:56:05 - INFO - __main__ - Step 4822: {'lr': 0.0004995519126095506, 'samples': 925824, 'steps': 4821, 'loss/train': 2.3707022666931152} +11/06/2021 21:56:05 - INFO - __main__ - Step 4823: {'lr': 0.0004995515949684384, 'samples': 926016, 'steps': 4822, 'loss/train': 1.6298257112503052} +11/06/2021 21:56:05 - INFO - __main__ - Step 4824: {'lr': 0.000499551277214882, 'samples': 926208, 'steps': 4823, 'loss/train': 1.6904128789901733} +11/06/2021 21:56:06 - INFO - __main__ - Step 4825: {'lr': 0.0004995509593488818, 'samples': 926400, 'steps': 4824, 'loss/train': 2.1001079082489014} +11/06/2021 21:56:07 - INFO - __main__ - Step 4826: {'lr': 0.0004995506413704376, 'samples': 926592, 'steps': 4825, 'loss/train': 1.8763246536254883} +11/06/2021 21:56:07 - INFO - __main__ - Step 4827: {'lr': 0.0004995503232795498, 'samples': 926784, 'steps': 4826, 'loss/train': 1.9993937015533447} +11/06/2021 21:56:07 - INFO - __main__ - Step 4828: {'lr': 0.0004995500050762185, 'samples': 926976, 'steps': 4827, 'loss/train': 2.1457080841064453} +11/06/2021 21:56:08 - INFO - __main__ - Step 4829: {'lr': 0.0004995496867604438, 'samples': 927168, 'steps': 4828, 'loss/train': 1.929814338684082} +11/06/2021 21:56:09 - INFO - __main__ - Step 4830: {'lr': 0.0004995493683322259, 'samples': 927360, 'steps': 4829, 'loss/train': 1.904067873954773} +11/06/2021 21:56:09 - INFO - __main__ - Step 4831: {'lr': 0.0004995490497915649, 'samples': 927552, 'steps': 4830, 'loss/train': 2.4040565490722656} +11/06/2021 21:56:09 - INFO - __main__ - Step 4832: {'lr': 0.0004995487311384609, 'samples': 927744, 'steps': 4831, 'loss/train': 2.00188946723938} +11/06/2021 21:56:10 - INFO - __main__ - Step 4833: {'lr': 0.0004995484123729141, 'samples': 927936, 'steps': 4832, 'loss/train': 2.0301706790924072} +11/06/2021 21:56:10 - INFO - __main__ - Step 4834: {'lr': 0.0004995480934949247, 'samples': 928128, 'steps': 4833, 'loss/train': 1.7859026193618774} +11/06/2021 21:56:11 - INFO - __main__ - Step 4835: {'lr': 0.0004995477745044927, 'samples': 928320, 'steps': 4834, 'loss/train': 1.3403795957565308} +11/06/2021 21:56:12 - INFO - __main__ - Step 4836: {'lr': 0.0004995474554016184, 'samples': 928512, 'steps': 4835, 'loss/train': 2.4826717376708984} +11/06/2021 21:56:12 - INFO - __main__ - Step 4837: {'lr': 0.0004995471361863017, 'samples': 928704, 'steps': 4836, 'loss/train': 2.1667168140411377} +11/06/2021 21:56:12 - INFO - __main__ - Step 4838: {'lr': 0.0004995468168585431, 'samples': 928896, 'steps': 4837, 'loss/train': 1.3020102977752686} +11/06/2021 21:56:13 - INFO - __main__ - Step 4839: {'lr': 0.0004995464974183424, 'samples': 929088, 'steps': 4838, 'loss/train': 2.1668708324432373} +11/06/2021 21:56:14 - INFO - __main__ - Step 4840: {'lr': 0.0004995461778657002, 'samples': 929280, 'steps': 4839, 'loss/train': 1.8353111743927002} +11/06/2021 21:56:14 - INFO - __main__ - Step 4841: {'lr': 0.000499545858200616, 'samples': 929472, 'steps': 4840, 'loss/train': 1.82950758934021} +11/06/2021 21:56:14 - INFO - __main__ - Step 4842: {'lr': 0.0004995455384230904, 'samples': 929664, 'steps': 4841, 'loss/train': 1.8687033653259277} +11/06/2021 21:56:15 - INFO - __main__ - Step 4843: {'lr': 0.0004995452185331235, 'samples': 929856, 'steps': 4842, 'loss/train': 0.33405929803848267} +11/06/2021 21:56:15 - INFO - __main__ - Step 4844: {'lr': 0.0004995448985307153, 'samples': 930048, 'steps': 4843, 'loss/train': 1.0525949001312256} +11/06/2021 21:56:16 - INFO - __main__ - Step 4845: {'lr': 0.0004995445784158661, 'samples': 930240, 'steps': 4844, 'loss/train': 2.037909507751465} +11/06/2021 21:56:16 - INFO - __main__ - Step 4846: {'lr': 0.0004995442581885759, 'samples': 930432, 'steps': 4845, 'loss/train': 1.789475679397583} +11/06/2021 21:56:17 - INFO - __main__ - Step 4847: {'lr': 0.0004995439378488449, 'samples': 930624, 'steps': 4846, 'loss/train': 1.7952702045440674} +11/06/2021 21:56:17 - INFO - __main__ - Step 4848: {'lr': 0.0004995436173966733, 'samples': 930816, 'steps': 4847, 'loss/train': 1.640943169593811} +11/06/2021 21:56:17 - INFO - __main__ - Step 4849: {'lr': 0.0004995432968320611, 'samples': 931008, 'steps': 4848, 'loss/train': 2.3322298526763916} +11/06/2021 21:56:19 - INFO - __main__ - Step 4850: {'lr': 0.0004995429761550086, 'samples': 931200, 'steps': 4849, 'loss/train': 2.3583528995513916} +11/06/2021 21:56:19 - INFO - __main__ - Step 4851: {'lr': 0.0004995426553655159, 'samples': 931392, 'steps': 4850, 'loss/train': 1.6499428749084473} +11/06/2021 21:56:19 - INFO - __main__ - Step 4852: {'lr': 0.0004995423344635831, 'samples': 931584, 'steps': 4851, 'loss/train': 1.9984158277511597} +11/06/2021 21:56:20 - INFO - __main__ - Step 4853: {'lr': 0.0004995420134492105, 'samples': 931776, 'steps': 4852, 'loss/train': 2.299149513244629} +11/06/2021 21:56:20 - INFO - __main__ - Step 4854: {'lr': 0.0004995416923223979, 'samples': 931968, 'steps': 4853, 'loss/train': 2.4122209548950195} +11/06/2021 21:56:20 - INFO - __main__ - Step 4855: {'lr': 0.0004995413710831458, 'samples': 932160, 'steps': 4854, 'loss/train': 2.0572216510772705} +11/06/2021 21:56:21 - INFO - __main__ - Step 4856: {'lr': 0.0004995410497314542, 'samples': 932352, 'steps': 4855, 'loss/train': 1.9187612533569336} +11/06/2021 21:56:22 - INFO - __main__ - Step 4857: {'lr': 0.0004995407282673232, 'samples': 932544, 'steps': 4856, 'loss/train': 1.4883348941802979} +11/06/2021 21:56:22 - INFO - __main__ - Step 4858: {'lr': 0.000499540406690753, 'samples': 932736, 'steps': 4857, 'loss/train': 1.9691627025604248} +11/06/2021 21:56:22 - INFO - __main__ - Step 4859: {'lr': 0.0004995400850017438, 'samples': 932928, 'steps': 4858, 'loss/train': 1.930557131767273} +11/06/2021 21:56:23 - INFO - __main__ - Step 4860: {'lr': 0.0004995397632002957, 'samples': 933120, 'steps': 4859, 'loss/train': 1.965431809425354} +11/06/2021 21:56:24 - INFO - __main__ - Step 4861: {'lr': 0.0004995394412864088, 'samples': 933312, 'steps': 4860, 'loss/train': 1.9139984846115112} +11/06/2021 21:56:24 - INFO - __main__ - Step 4862: {'lr': 0.0004995391192600834, 'samples': 933504, 'steps': 4861, 'loss/train': 2.268007516860962} +11/06/2021 21:56:24 - INFO - __main__ - Step 4863: {'lr': 0.0004995387971213194, 'samples': 933696, 'steps': 4862, 'loss/train': 1.8037782907485962} +11/06/2021 21:56:25 - INFO - __main__ - Step 4864: {'lr': 0.000499538474870117, 'samples': 933888, 'steps': 4863, 'loss/train': 1.7647819519042969} +11/06/2021 21:56:25 - INFO - __main__ - Step 4865: {'lr': 0.0004995381525064765, 'samples': 934080, 'steps': 4864, 'loss/train': 2.0817017555236816} +11/06/2021 21:56:26 - INFO - __main__ - Step 4866: {'lr': 0.0004995378300303979, 'samples': 934272, 'steps': 4865, 'loss/train': 2.1606099605560303} +11/06/2021 21:56:27 - INFO - __main__ - Step 4867: {'lr': 0.0004995375074418815, 'samples': 934464, 'steps': 4866, 'loss/train': 2.0382091999053955} +11/06/2021 21:56:27 - INFO - __main__ - Step 4868: {'lr': 0.0004995371847409273, 'samples': 934656, 'steps': 4867, 'loss/train': 0.9957026243209839} +11/06/2021 21:56:27 - INFO - __main__ - Step 4869: {'lr': 0.0004995368619275355, 'samples': 934848, 'steps': 4868, 'loss/train': 1.8586081266403198} +11/06/2021 21:56:28 - INFO - __main__ - Step 4870: {'lr': 0.0004995365390017062, 'samples': 935040, 'steps': 4869, 'loss/train': 1.3379945755004883} +11/06/2021 21:56:28 - INFO - __main__ - Step 4871: {'lr': 0.0004995362159634396, 'samples': 935232, 'steps': 4870, 'loss/train': 1.8667609691619873} +11/06/2021 21:56:29 - INFO - __main__ - Step 4872: {'lr': 0.0004995358928127359, 'samples': 935424, 'steps': 4871, 'loss/train': 1.3676517009735107} +11/06/2021 21:56:29 - INFO - __main__ - Step 4873: {'lr': 0.0004995355695495952, 'samples': 935616, 'steps': 4872, 'loss/train': 1.948101282119751} +11/06/2021 21:56:30 - INFO - __main__ - Step 4874: {'lr': 0.0004995352461740174, 'samples': 935808, 'steps': 4873, 'loss/train': 1.8517183065414429} +11/06/2021 21:56:30 - INFO - __main__ - Step 4875: {'lr': 0.0004995349226860031, 'samples': 936000, 'steps': 4874, 'loss/train': 1.5299654006958008} +11/06/2021 21:56:30 - INFO - __main__ - Step 4876: {'lr': 0.0004995345990855522, 'samples': 936192, 'steps': 4875, 'loss/train': 2.013723850250244} +11/06/2021 21:56:31 - INFO - __main__ - Step 4877: {'lr': 0.0004995342753726647, 'samples': 936384, 'steps': 4876, 'loss/train': 2.0262885093688965} +11/06/2021 21:56:32 - INFO - __main__ - Step 4878: {'lr': 0.0004995339515473411, 'samples': 936576, 'steps': 4877, 'loss/train': 1.6470019817352295} +11/06/2021 21:56:32 - INFO - __main__ - Step 4879: {'lr': 0.0004995336276095812, 'samples': 936768, 'steps': 4878, 'loss/train': 1.9853967428207397} +11/06/2021 21:56:32 - INFO - __main__ - Step 4880: {'lr': 0.0004995333035593853, 'samples': 936960, 'steps': 4879, 'loss/train': 1.7942310571670532} +11/06/2021 21:56:33 - INFO - __main__ - Step 4881: {'lr': 0.0004995329793967537, 'samples': 937152, 'steps': 4880, 'loss/train': 2.1231250762939453} +11/06/2021 21:56:34 - INFO - __main__ - Step 4882: {'lr': 0.0004995326551216862, 'samples': 937344, 'steps': 4881, 'loss/train': 1.599252700805664} +11/06/2021 21:56:34 - INFO - __main__ - Step 4883: {'lr': 0.0004995323307341832, 'samples': 937536, 'steps': 4882, 'loss/train': 1.833884596824646} +11/06/2021 21:56:34 - INFO - __main__ - Step 4884: {'lr': 0.0004995320062342449, 'samples': 937728, 'steps': 4883, 'loss/train': 1.6169829368591309} +11/06/2021 21:56:35 - INFO - __main__ - Step 4885: {'lr': 0.0004995316816218712, 'samples': 937920, 'steps': 4884, 'loss/train': 2.102433681488037} +11/06/2021 21:56:35 - INFO - __main__ - Step 4886: {'lr': 0.0004995313568970625, 'samples': 938112, 'steps': 4885, 'loss/train': 2.166229724884033} +11/06/2021 21:56:36 - INFO - __main__ - Step 4887: {'lr': 0.0004995310320598187, 'samples': 938304, 'steps': 4886, 'loss/train': 2.130415916442871} +11/06/2021 21:56:36 - INFO - __main__ - Step 4888: {'lr': 0.0004995307071101401, 'samples': 938496, 'steps': 4887, 'loss/train': 2.281303882598877} +11/06/2021 21:56:37 - INFO - __main__ - Step 4889: {'lr': 0.0004995303820480268, 'samples': 938688, 'steps': 4888, 'loss/train': 1.7925283908843994} +11/06/2021 21:56:37 - INFO - __main__ - Step 4890: {'lr': 0.000499530056873479, 'samples': 938880, 'steps': 4889, 'loss/train': 2.1150357723236084} +11/06/2021 21:56:37 - INFO - __main__ - Step 4891: {'lr': 0.0004995297315864968, 'samples': 939072, 'steps': 4890, 'loss/train': 1.8841792345046997} +11/06/2021 21:56:39 - INFO - __main__ - Step 4892: {'lr': 0.0004995294061870802, 'samples': 939264, 'steps': 4891, 'loss/train': 1.9895226955413818} +11/06/2021 21:56:39 - INFO - __main__ - Step 4893: {'lr': 0.0004995290806752297, 'samples': 939456, 'steps': 4892, 'loss/train': 2.05294132232666} +11/06/2021 21:56:39 - INFO - __main__ - Step 4894: {'lr': 0.0004995287550509452, 'samples': 939648, 'steps': 4893, 'loss/train': 1.6693605184555054} +11/06/2021 21:56:40 - INFO - __main__ - Step 4895: {'lr': 0.0004995284293142268, 'samples': 939840, 'steps': 4894, 'loss/train': 2.2964420318603516} +11/06/2021 21:56:40 - INFO - __main__ - Step 4896: {'lr': 0.0004995281034650748, 'samples': 940032, 'steps': 4895, 'loss/train': 2.0679450035095215} +11/06/2021 21:56:41 - INFO - __main__ - Step 4897: {'lr': 0.0004995277775034894, 'samples': 940224, 'steps': 4896, 'loss/train': 1.8550939559936523} +11/06/2021 21:56:41 - INFO - __main__ - Step 4898: {'lr': 0.0004995274514294706, 'samples': 940416, 'steps': 4897, 'loss/train': 1.983759880065918} +11/06/2021 21:56:42 - INFO - __main__ - Step 4899: {'lr': 0.0004995271252430184, 'samples': 940608, 'steps': 4898, 'loss/train': 2.2435123920440674} +11/06/2021 21:56:42 - INFO - __main__ - Step 4900: {'lr': 0.0004995267989441332, 'samples': 940800, 'steps': 4899, 'loss/train': 1.9692909717559814} +11/06/2021 21:56:42 - INFO - __main__ - Step 4901: {'lr': 0.0004995264725328151, 'samples': 940992, 'steps': 4900, 'loss/train': 1.1252635717391968} +11/06/2021 21:56:43 - INFO - __main__ - Step 4902: {'lr': 0.0004995261460090644, 'samples': 941184, 'steps': 4901, 'loss/train': 2.1014087200164795} +11/06/2021 21:56:44 - INFO - __main__ - Step 4903: {'lr': 0.0004995258193728809, 'samples': 941376, 'steps': 4902, 'loss/train': 2.087357521057129} +11/06/2021 21:56:44 - INFO - __main__ - Step 4904: {'lr': 0.0004995254926242649, 'samples': 941568, 'steps': 4903, 'loss/train': 1.3872030973434448} +11/06/2021 21:56:44 - INFO - __main__ - Step 4905: {'lr': 0.0004995251657632165, 'samples': 941760, 'steps': 4904, 'loss/train': 1.6950825452804565} +11/06/2021 21:56:45 - INFO - __main__ - Step 4906: {'lr': 0.000499524838789736, 'samples': 941952, 'steps': 4905, 'loss/train': 2.146413803100586} +11/06/2021 21:56:46 - INFO - __main__ - Step 4907: {'lr': 0.0004995245117038235, 'samples': 942144, 'steps': 4906, 'loss/train': 2.0605762004852295} +11/06/2021 21:56:46 - INFO - __main__ - Step 4908: {'lr': 0.0004995241845054791, 'samples': 942336, 'steps': 4907, 'loss/train': 2.1872684955596924} +11/06/2021 21:56:46 - INFO - __main__ - Step 4909: {'lr': 0.0004995238571947029, 'samples': 942528, 'steps': 4908, 'loss/train': 1.7782576084136963} +11/06/2021 21:56:47 - INFO - __main__ - Step 4910: {'lr': 0.0004995235297714951, 'samples': 942720, 'steps': 4909, 'loss/train': 1.769343614578247} +11/06/2021 21:56:47 - INFO - __main__ - Step 4911: {'lr': 0.0004995232022358559, 'samples': 942912, 'steps': 4910, 'loss/train': 2.6425294876098633} +11/06/2021 21:56:48 - INFO - __main__ - Step 4912: {'lr': 0.0004995228745877853, 'samples': 943104, 'steps': 4911, 'loss/train': 1.9566208124160767} +11/06/2021 21:56:49 - INFO - __main__ - Step 4913: {'lr': 0.0004995225468272836, 'samples': 943296, 'steps': 4912, 'loss/train': 1.9008264541625977} +11/06/2021 21:56:49 - INFO - __main__ - Step 4914: {'lr': 0.0004995222189543509, 'samples': 943488, 'steps': 4913, 'loss/train': 6.304197311401367} +11/06/2021 21:56:49 - INFO - __main__ - Step 4915: {'lr': 0.0004995218909689873, 'samples': 943680, 'steps': 4914, 'loss/train': 1.216681718826294} +11/06/2021 21:56:50 - INFO - __main__ - Step 4916: {'lr': 0.0004995215628711931, 'samples': 943872, 'steps': 4915, 'loss/train': 2.1877267360687256} +11/06/2021 21:56:50 - INFO - __main__ - Step 4917: {'lr': 0.0004995212346609682, 'samples': 944064, 'steps': 4916, 'loss/train': 2.259002923965454} +11/06/2021 21:56:51 - INFO - __main__ - Step 4918: {'lr': 0.0004995209063383129, 'samples': 944256, 'steps': 4917, 'loss/train': 1.607182264328003} +11/06/2021 21:56:51 - INFO - __main__ - Step 4919: {'lr': 0.0004995205779032274, 'samples': 944448, 'steps': 4918, 'loss/train': 2.302341938018799} +11/06/2021 21:56:52 - INFO - __main__ - Step 4920: {'lr': 0.0004995202493557118, 'samples': 944640, 'steps': 4919, 'loss/train': 1.7484567165374756} +11/06/2021 21:56:52 - INFO - __main__ - Step 4921: {'lr': 0.0004995199206957662, 'samples': 944832, 'steps': 4920, 'loss/train': 2.0463926792144775} +11/06/2021 21:56:53 - INFO - __main__ - Step 4922: {'lr': 0.0004995195919233906, 'samples': 945024, 'steps': 4921, 'loss/train': 2.1027209758758545} +11/06/2021 21:56:54 - INFO - __main__ - Step 4923: {'lr': 0.0004995192630385855, 'samples': 945216, 'steps': 4922, 'loss/train': 1.897849678993225} +11/06/2021 21:56:54 - INFO - __main__ - Step 4924: {'lr': 0.0004995189340413509, 'samples': 945408, 'steps': 4923, 'loss/train': 1.5796188116073608} +11/06/2021 21:56:55 - INFO - __main__ - Step 4925: {'lr': 0.0004995186049316868, 'samples': 945600, 'steps': 4924, 'loss/train': 2.1608316898345947} +11/06/2021 21:56:55 - INFO - __main__ - Step 4926: {'lr': 0.0004995182757095935, 'samples': 945792, 'steps': 4925, 'loss/train': 2.3778295516967773} +11/06/2021 21:56:55 - INFO - __main__ - Step 4927: {'lr': 0.0004995179463750712, 'samples': 945984, 'steps': 4926, 'loss/train': 2.6206376552581787} +11/06/2021 21:56:56 - INFO - __main__ - Step 4928: {'lr': 0.0004995176169281199, 'samples': 946176, 'steps': 4927, 'loss/train': 2.371328115463257} +11/06/2021 21:56:57 - INFO - __main__ - Step 4929: {'lr': 0.0004995172873687398, 'samples': 946368, 'steps': 4928, 'loss/train': 2.762335777282715} +11/06/2021 21:56:57 - INFO - __main__ - Step 4930: {'lr': 0.0004995169576969311, 'samples': 946560, 'steps': 4929, 'loss/train': 1.838969349861145} +11/06/2021 21:56:58 - INFO - __main__ - Step 4931: {'lr': 0.0004995166279126938, 'samples': 946752, 'steps': 4930, 'loss/train': 1.8372935056686401} +11/06/2021 21:56:58 - INFO - __main__ - Step 4932: {'lr': 0.0004995162980160283, 'samples': 946944, 'steps': 4931, 'loss/train': 1.7743967771530151} +11/06/2021 21:56:58 - INFO - __main__ - Step 4933: {'lr': 0.0004995159680069346, 'samples': 947136, 'steps': 4932, 'loss/train': 1.8914155960083008} +11/06/2021 21:56:59 - INFO - __main__ - Step 4934: {'lr': 0.0004995156378854127, 'samples': 947328, 'steps': 4933, 'loss/train': 1.7607487440109253} +11/06/2021 21:57:00 - INFO - __main__ - Step 4935: {'lr': 0.000499515307651463, 'samples': 947520, 'steps': 4934, 'loss/train': 2.1030728816986084} +11/06/2021 21:57:00 - INFO - __main__ - Step 4936: {'lr': 0.0004995149773050857, 'samples': 947712, 'steps': 4935, 'loss/train': 2.1479721069335938} +11/06/2021 21:57:01 - INFO - __main__ - Step 4937: {'lr': 0.0004995146468462806, 'samples': 947904, 'steps': 4936, 'loss/train': 1.576684832572937} +11/06/2021 21:57:01 - INFO - __main__ - Step 4938: {'lr': 0.0004995143162750481, 'samples': 948096, 'steps': 4937, 'loss/train': 2.200626850128174} +11/06/2021 21:57:02 - INFO - __main__ - Step 4939: {'lr': 0.0004995139855913883, 'samples': 948288, 'steps': 4938, 'loss/train': 2.6972954273223877} +11/06/2021 21:57:02 - INFO - __main__ - Step 4940: {'lr': 0.0004995136547953014, 'samples': 948480, 'steps': 4939, 'loss/train': 2.025506019592285} +11/06/2021 21:57:02 - INFO - __main__ - Step 4941: {'lr': 0.0004995133238867874, 'samples': 948672, 'steps': 4940, 'loss/train': 2.79832124710083} +11/06/2021 21:57:03 - INFO - __main__ - Step 4942: {'lr': 0.0004995129928658466, 'samples': 948864, 'steps': 4941, 'loss/train': 1.9636731147766113} +11/06/2021 21:57:03 - INFO - __main__ - Step 4943: {'lr': 0.0004995126617324791, 'samples': 949056, 'steps': 4942, 'loss/train': 2.302797317504883} +11/06/2021 21:57:04 - INFO - __main__ - Step 4944: {'lr': 0.000499512330486685, 'samples': 949248, 'steps': 4943, 'loss/train': 1.3910671472549438} +11/06/2021 21:57:05 - INFO - __main__ - Step 4945: {'lr': 0.0004995119991284645, 'samples': 949440, 'steps': 4944, 'loss/train': 1.6283067464828491} +11/06/2021 21:57:05 - INFO - __main__ - Step 4946: {'lr': 0.0004995116676578178, 'samples': 949632, 'steps': 4945, 'loss/train': 2.0636019706726074} +11/06/2021 21:57:05 - INFO - __main__ - Step 4947: {'lr': 0.000499511336074745, 'samples': 949824, 'steps': 4946, 'loss/train': 1.653847575187683} +11/06/2021 21:57:06 - INFO - __main__ - Step 4948: {'lr': 0.0004995110043792462, 'samples': 950016, 'steps': 4947, 'loss/train': 1.9270820617675781} +11/06/2021 21:57:06 - INFO - __main__ - Step 4949: {'lr': 0.0004995106725713217, 'samples': 950208, 'steps': 4948, 'loss/train': 2.0320072174072266} +11/06/2021 21:57:07 - INFO - __main__ - Step 4950: {'lr': 0.0004995103406509713, 'samples': 950400, 'steps': 4949, 'loss/train': 1.9087032079696655} +11/06/2021 21:57:07 - INFO - __main__ - Step 4951: {'lr': 0.0004995100086181957, 'samples': 950592, 'steps': 4950, 'loss/train': 2.294539451599121} +11/06/2021 21:57:08 - INFO - __main__ - Step 4952: {'lr': 0.0004995096764729945, 'samples': 950784, 'steps': 4951, 'loss/train': 1.427341341972351} +11/06/2021 21:57:08 - INFO - __main__ - Step 4953: {'lr': 0.0004995093442153681, 'samples': 950976, 'steps': 4952, 'loss/train': 1.223702073097229} +11/06/2021 21:57:09 - INFO - __main__ - Step 4954: {'lr': 0.0004995090118453167, 'samples': 951168, 'steps': 4953, 'loss/train': 1.9926605224609375} +11/06/2021 21:57:09 - INFO - __main__ - Step 4955: {'lr': 0.0004995086793628405, 'samples': 951360, 'steps': 4954, 'loss/train': 2.119666337966919} +11/06/2021 21:57:10 - INFO - __main__ - Step 4956: {'lr': 0.0004995083467679394, 'samples': 951552, 'steps': 4955, 'loss/train': 1.4242171049118042} +11/06/2021 21:57:10 - INFO - __main__ - Step 4957: {'lr': 0.0004995080140606137, 'samples': 951744, 'steps': 4956, 'loss/train': 2.439540147781372} +11/06/2021 21:57:11 - INFO - __main__ - Step 4958: {'lr': 0.0004995076812408636, 'samples': 951936, 'steps': 4957, 'loss/train': 1.9032562971115112} +11/06/2021 21:57:11 - INFO - __main__ - Step 4959: {'lr': 0.0004995073483086891, 'samples': 952128, 'steps': 4958, 'loss/train': 1.8582649230957031} +11/06/2021 21:57:12 - INFO - __main__ - Step 4960: {'lr': 0.0004995070152640905, 'samples': 952320, 'steps': 4959, 'loss/train': 2.372265100479126} +11/06/2021 21:57:12 - INFO - __main__ - Step 4961: {'lr': 0.0004995066821070679, 'samples': 952512, 'steps': 4960, 'loss/train': 1.438249945640564} +11/06/2021 21:57:13 - INFO - __main__ - Step 4962: {'lr': 0.0004995063488376214, 'samples': 952704, 'steps': 4961, 'loss/train': 2.022662401199341} +11/06/2021 21:57:13 - INFO - __main__ - Step 4963: {'lr': 0.0004995060154557513, 'samples': 952896, 'steps': 4962, 'loss/train': 2.1550307273864746} +11/06/2021 21:57:13 - INFO - __main__ - Step 4964: {'lr': 0.0004995056819614575, 'samples': 953088, 'steps': 4963, 'loss/train': 1.8373814821243286} +11/06/2021 21:57:14 - INFO - __main__ - Step 4965: {'lr': 0.0004995053483547404, 'samples': 953280, 'steps': 4964, 'loss/train': 2.0746841430664062} +11/06/2021 21:57:15 - INFO - __main__ - Step 4966: {'lr': 0.0004995050146355999, 'samples': 953472, 'steps': 4965, 'loss/train': 1.7231754064559937} +11/06/2021 21:57:15 - INFO - __main__ - Step 4967: {'lr': 0.0004995046808040363, 'samples': 953664, 'steps': 4966, 'loss/train': 2.3439464569091797} +11/06/2021 21:57:15 - INFO - __main__ - Step 4968: {'lr': 0.0004995043468600499, 'samples': 953856, 'steps': 4967, 'loss/train': 1.1684303283691406} +11/06/2021 21:57:16 - INFO - __main__ - Step 4969: {'lr': 0.0004995040128036405, 'samples': 954048, 'steps': 4968, 'loss/train': 1.818418264389038} +11/06/2021 21:57:16 - INFO - __main__ - Step 4970: {'lr': 0.0004995036786348086, 'samples': 954240, 'steps': 4969, 'loss/train': 2.059702157974243} +11/06/2021 21:57:17 - INFO - __main__ - Step 4971: {'lr': 0.0004995033443535541, 'samples': 954432, 'steps': 4970, 'loss/train': 1.7052550315856934} +11/06/2021 21:57:17 - INFO - __main__ - Step 4972: {'lr': 0.0004995030099598773, 'samples': 954624, 'steps': 4971, 'loss/train': 2.043684720993042} +11/06/2021 21:57:18 - INFO - __main__ - Step 4973: {'lr': 0.0004995026754537783, 'samples': 954816, 'steps': 4972, 'loss/train': 1.259334683418274} +11/06/2021 21:57:18 - INFO - __main__ - Step 4974: {'lr': 0.0004995023408352572, 'samples': 955008, 'steps': 4973, 'loss/train': 2.089118242263794} +11/06/2021 21:57:18 - INFO - __main__ - Step 4975: {'lr': 0.0004995020061043142, 'samples': 955200, 'steps': 4974, 'loss/train': 2.190615177154541} +11/06/2021 21:57:20 - INFO - __main__ - Step 4976: {'lr': 0.0004995016712609495, 'samples': 955392, 'steps': 4975, 'loss/train': 2.123932361602783} +11/06/2021 21:57:20 - INFO - __main__ - Step 4977: {'lr': 0.0004995013363051631, 'samples': 955584, 'steps': 4976, 'loss/train': 2.357672929763794} +11/06/2021 21:57:20 - INFO - __main__ - Step 4978: {'lr': 0.0004995010012369554, 'samples': 955776, 'steps': 4977, 'loss/train': 2.4011850357055664} +11/06/2021 21:57:21 - INFO - __main__ - Step 4979: {'lr': 0.0004995006660563262, 'samples': 955968, 'steps': 4978, 'loss/train': 2.2604053020477295} +11/06/2021 21:57:21 - INFO - __main__ - Step 4980: {'lr': 0.000499500330763276, 'samples': 956160, 'steps': 4979, 'loss/train': 1.697622537612915} +11/06/2021 21:57:22 - INFO - __main__ - Step 4981: {'lr': 0.0004994999953578048, 'samples': 956352, 'steps': 4980, 'loss/train': 2.418104887008667} +11/06/2021 21:57:22 - INFO - __main__ - Step 4982: {'lr': 0.0004994996598399127, 'samples': 956544, 'steps': 4981, 'loss/train': 1.7995312213897705} +11/06/2021 21:57:23 - INFO - __main__ - Step 4983: {'lr': 0.0004994993242095999, 'samples': 956736, 'steps': 4982, 'loss/train': 1.0818099975585938} +11/06/2021 21:57:23 - INFO - __main__ - Step 4984: {'lr': 0.0004994989884668665, 'samples': 956928, 'steps': 4983, 'loss/train': 1.7262250185012817} +11/06/2021 21:57:23 - INFO - __main__ - Step 4985: {'lr': 0.0004994986526117127, 'samples': 957120, 'steps': 4984, 'loss/train': 1.8972023725509644} +11/06/2021 21:57:24 - INFO - __main__ - Step 4986: {'lr': 0.0004994983166441388, 'samples': 957312, 'steps': 4985, 'loss/train': 1.5889555215835571} +11/06/2021 21:57:25 - INFO - __main__ - Step 4987: {'lr': 0.0004994979805641448, 'samples': 957504, 'steps': 4986, 'loss/train': 2.0608432292938232} +11/06/2021 21:57:25 - INFO - __main__ - Step 4988: {'lr': 0.0004994976443717308, 'samples': 957696, 'steps': 4987, 'loss/train': 2.1303555965423584} +11/06/2021 21:57:25 - INFO - __main__ - Step 4989: {'lr': 0.000499497308066897, 'samples': 957888, 'steps': 4988, 'loss/train': 1.3450038433074951} +11/06/2021 21:57:26 - INFO - __main__ - Step 4990: {'lr': 0.0004994969716496435, 'samples': 958080, 'steps': 4989, 'loss/train': 1.9656953811645508} +11/06/2021 21:57:27 - INFO - __main__ - Step 4991: {'lr': 0.0004994966351199706, 'samples': 958272, 'steps': 4990, 'loss/train': 1.8768229484558105} +11/06/2021 21:57:27 - INFO - __main__ - Step 4992: {'lr': 0.0004994962984778784, 'samples': 958464, 'steps': 4991, 'loss/train': 0.9767778515815735} +11/06/2021 21:57:27 - INFO - __main__ - Step 4993: {'lr': 0.0004994959617233669, 'samples': 958656, 'steps': 4992, 'loss/train': 1.952646255493164} +11/06/2021 21:57:28 - INFO - __main__ - Step 4994: {'lr': 0.0004994956248564364, 'samples': 958848, 'steps': 4993, 'loss/train': 2.012577533721924} +11/06/2021 21:57:28 - INFO - __main__ - Step 4995: {'lr': 0.000499495287877087, 'samples': 959040, 'steps': 4994, 'loss/train': 2.6770846843719482} +11/06/2021 21:57:29 - INFO - __main__ - Step 4996: {'lr': 0.000499494950785319, 'samples': 959232, 'steps': 4995, 'loss/train': 0.9503514766693115} +11/06/2021 21:57:30 - INFO - __main__ - Step 4997: {'lr': 0.0004994946135811324, 'samples': 959424, 'steps': 4996, 'loss/train': 1.3578064441680908} +11/06/2021 21:57:30 - INFO - __main__ - Step 4998: {'lr': 0.0004994942762645274, 'samples': 959616, 'steps': 4997, 'loss/train': 1.6439087390899658} +11/06/2021 21:57:30 - INFO - __main__ - Step 4999: {'lr': 0.000499493938835504, 'samples': 959808, 'steps': 4998, 'loss/train': 1.955640196800232} +11/06/2021 21:57:31 - INFO - __main__ - Step 5000: {'lr': 0.0004994936012940626, 'samples': 960000, 'steps': 4999, 'loss/train': 2.0416653156280518} +11/06/2021 21:57:32 - INFO - __main__ - Step 5001: {'lr': 0.0004994932636402031, 'samples': 960192, 'steps': 5000, 'loss/train': 2.211860418319702} +11/06/2021 21:57:32 - INFO - __main__ - Step 5002: {'lr': 0.000499492925873926, 'samples': 960384, 'steps': 5001, 'loss/train': 2.095062017440796} +11/06/2021 21:57:33 - INFO - __main__ - Step 5003: {'lr': 0.000499492587995231, 'samples': 960576, 'steps': 5002, 'loss/train': 2.049713611602783} +11/06/2021 21:57:33 - INFO - __main__ - Step 5004: {'lr': 0.0004994922500041186, 'samples': 960768, 'steps': 5003, 'loss/train': 1.5910391807556152} +11/06/2021 21:57:33 - INFO - __main__ - Step 5005: {'lr': 0.0004994919119005888, 'samples': 960960, 'steps': 5004, 'loss/train': 2.3668973445892334} +11/06/2021 21:57:34 - INFO - __main__ - Step 5006: {'lr': 0.0004994915736846418, 'samples': 961152, 'steps': 5005, 'loss/train': 2.0674057006835938} +11/06/2021 21:57:35 - INFO - __main__ - Step 5007: {'lr': 0.0004994912353562778, 'samples': 961344, 'steps': 5006, 'loss/train': 2.0364692211151123} +11/06/2021 21:57:35 - INFO - __main__ - Step 5008: {'lr': 0.0004994908969154968, 'samples': 961536, 'steps': 5007, 'loss/train': 1.763395071029663} +11/06/2021 21:57:36 - INFO - __main__ - Step 5009: {'lr': 0.0004994905583622992, 'samples': 961728, 'steps': 5008, 'loss/train': 1.6759827136993408} +11/06/2021 21:57:36 - INFO - __main__ - Step 5010: {'lr': 0.000499490219696685, 'samples': 961920, 'steps': 5009, 'loss/train': 1.3407360315322876} +11/06/2021 21:57:36 - INFO - __main__ - Step 5011: {'lr': 0.0004994898809186542, 'samples': 962112, 'steps': 5010, 'loss/train': 2.153372049331665} +11/06/2021 21:57:37 - INFO - __main__ - Step 5012: {'lr': 0.0004994895420282072, 'samples': 962304, 'steps': 5011, 'loss/train': 2.228909969329834} +11/06/2021 21:57:38 - INFO - __main__ - Step 5013: {'lr': 0.000499489203025344, 'samples': 962496, 'steps': 5012, 'loss/train': 1.8992091417312622} +11/06/2021 21:57:38 - INFO - __main__ - Step 5014: {'lr': 0.000499488863910065, 'samples': 962688, 'steps': 5013, 'loss/train': 1.6911919116973877} +11/06/2021 21:57:38 - INFO - __main__ - Step 5015: {'lr': 0.00049948852468237, 'samples': 962880, 'steps': 5014, 'loss/train': 1.5895403623580933} +11/06/2021 21:57:39 - INFO - __main__ - Step 5016: {'lr': 0.0004994881853422594, 'samples': 963072, 'steps': 5015, 'loss/train': 1.8377931118011475} +11/06/2021 21:57:40 - INFO - __main__ - Step 5017: {'lr': 0.0004994878458897332, 'samples': 963264, 'steps': 5016, 'loss/train': 2.5478765964508057} +11/06/2021 21:57:40 - INFO - __main__ - Step 5018: {'lr': 0.0004994875063247916, 'samples': 963456, 'steps': 5017, 'loss/train': 1.8936893939971924} +11/06/2021 21:57:41 - INFO - __main__ - Step 5019: {'lr': 0.0004994871666474348, 'samples': 963648, 'steps': 5018, 'loss/train': 2.324462890625} +11/06/2021 21:57:41 - INFO - __main__ - Step 5020: {'lr': 0.000499486826857663, 'samples': 963840, 'steps': 5019, 'loss/train': 1.8107075691223145} +11/06/2021 21:57:41 - INFO - __main__ - Step 5021: {'lr': 0.0004994864869554763, 'samples': 964032, 'steps': 5020, 'loss/train': 1.989519476890564} +11/06/2021 21:57:42 - INFO - __main__ - Step 5022: {'lr': 0.0004994861469408748, 'samples': 964224, 'steps': 5021, 'loss/train': 1.991037368774414} +11/06/2021 21:57:43 - INFO - __main__ - Step 5023: {'lr': 0.0004994858068138587, 'samples': 964416, 'steps': 5022, 'loss/train': 1.7982574701309204} +11/06/2021 21:57:43 - INFO - __main__ - Step 5024: {'lr': 0.0004994854665744282, 'samples': 964608, 'steps': 5023, 'loss/train': 2.380490303039551} +11/06/2021 21:57:43 - INFO - __main__ - Step 5025: {'lr': 0.0004994851262225832, 'samples': 964800, 'steps': 5024, 'loss/train': 1.3919230699539185} +11/06/2021 21:57:44 - INFO - __main__ - Step 5026: {'lr': 0.0004994847857583242, 'samples': 964992, 'steps': 5025, 'loss/train': 2.2827370166778564} +11/06/2021 21:57:45 - INFO - __main__ - Step 5027: {'lr': 0.0004994844451816512, 'samples': 965184, 'steps': 5026, 'loss/train': 2.1347203254699707} +11/06/2021 21:57:45 - INFO - __main__ - Step 5028: {'lr': 0.0004994841044925644, 'samples': 965376, 'steps': 5027, 'loss/train': 1.6065678596496582} +11/06/2021 21:57:45 - INFO - __main__ - Step 5029: {'lr': 0.0004994837636910638, 'samples': 965568, 'steps': 5028, 'loss/train': 1.7136719226837158} +11/06/2021 21:57:46 - INFO - __main__ - Step 5030: {'lr': 0.0004994834227771498, 'samples': 965760, 'steps': 5029, 'loss/train': 2.129387617111206} +11/06/2021 21:57:46 - INFO - __main__ - Step 5031: {'lr': 0.0004994830817508224, 'samples': 965952, 'steps': 5030, 'loss/train': 2.3650991916656494} +11/06/2021 21:57:47 - INFO - __main__ - Step 5032: {'lr': 0.0004994827406120816, 'samples': 966144, 'steps': 5031, 'loss/train': 1.8486300706863403} +11/06/2021 21:57:47 - INFO - __main__ - Step 5033: {'lr': 0.0004994823993609279, 'samples': 966336, 'steps': 5032, 'loss/train': 0.8590723872184753} +11/06/2021 21:57:48 - INFO - __main__ - Step 5034: {'lr': 0.0004994820579973612, 'samples': 966528, 'steps': 5033, 'loss/train': 1.7398724555969238} +11/06/2021 21:57:48 - INFO - __main__ - Step 5035: {'lr': 0.0004994817165213817, 'samples': 966720, 'steps': 5034, 'loss/train': 2.0410008430480957} +11/06/2021 21:57:48 - INFO - __main__ - Step 5036: {'lr': 0.0004994813749329897, 'samples': 966912, 'steps': 5035, 'loss/train': 1.631545066833496} +11/06/2021 21:57:50 - INFO - __main__ - Step 5037: {'lr': 0.0004994810332321852, 'samples': 967104, 'steps': 5036, 'loss/train': 1.492642879486084} +11/06/2021 21:57:50 - INFO - __main__ - Step 5038: {'lr': 0.0004994806914189684, 'samples': 967296, 'steps': 5037, 'loss/train': 2.159714460372925} +11/06/2021 21:57:50 - INFO - __main__ - Step 5039: {'lr': 0.0004994803494933394, 'samples': 967488, 'steps': 5038, 'loss/train': 2.5530550479888916} +11/06/2021 21:57:51 - INFO - __main__ - Step 5040: {'lr': 0.0004994800074552985, 'samples': 967680, 'steps': 5039, 'loss/train': 1.7678231000900269} +11/06/2021 21:57:51 - INFO - __main__ - Step 5041: {'lr': 0.0004994796653048457, 'samples': 967872, 'steps': 5040, 'loss/train': 2.178983211517334} +11/06/2021 21:57:51 - INFO - __main__ - Step 5042: {'lr': 0.0004994793230419812, 'samples': 968064, 'steps': 5041, 'loss/train': 2.832493305206299} +11/06/2021 21:57:52 - INFO - __main__ - Step 5043: {'lr': 0.0004994789806667052, 'samples': 968256, 'steps': 5042, 'loss/train': 1.9693965911865234} +11/06/2021 21:57:53 - INFO - __main__ - Step 5044: {'lr': 0.0004994786381790178, 'samples': 968448, 'steps': 5043, 'loss/train': 1.6492239236831665} +11/06/2021 21:57:53 - INFO - __main__ - Step 5045: {'lr': 0.0004994782955789191, 'samples': 968640, 'steps': 5044, 'loss/train': 1.885124683380127} +11/06/2021 21:57:53 - INFO - __main__ - Step 5046: {'lr': 0.0004994779528664095, 'samples': 968832, 'steps': 5045, 'loss/train': 2.0043511390686035} +11/06/2021 21:57:54 - INFO - __main__ - Step 5047: {'lr': 0.0004994776100414888, 'samples': 969024, 'steps': 5046, 'loss/train': 2.129291534423828} +11/06/2021 21:57:55 - INFO - __main__ - Step 5048: {'lr': 0.0004994772671041575, 'samples': 969216, 'steps': 5047, 'loss/train': 2.2023603916168213} +11/06/2021 21:57:55 - INFO - __main__ - Step 5049: {'lr': 0.0004994769240544155, 'samples': 969408, 'steps': 5048, 'loss/train': 2.209613084793091} +11/06/2021 21:57:55 - INFO - __main__ - Step 5050: {'lr': 0.000499476580892263, 'samples': 969600, 'steps': 5049, 'loss/train': 1.4724314212799072} +11/06/2021 21:57:56 - INFO - __main__ - Step 5051: {'lr': 0.0004994762376177004, 'samples': 969792, 'steps': 5050, 'loss/train': 2.012944459915161} +11/06/2021 21:57:56 - INFO - __main__ - Step 5052: {'lr': 0.0004994758942307274, 'samples': 969984, 'steps': 5051, 'loss/train': 1.9832876920700073} +11/06/2021 21:57:57 - INFO - __main__ - Step 5053: {'lr': 0.0004994755507313446, 'samples': 970176, 'steps': 5052, 'loss/train': 2.164370536804199} +11/06/2021 21:57:58 - INFO - __main__ - Step 5054: {'lr': 0.000499475207119552, 'samples': 970368, 'steps': 5053, 'loss/train': 2.118231773376465} +11/06/2021 21:57:58 - INFO - __main__ - Step 5055: {'lr': 0.0004994748633953495, 'samples': 970560, 'steps': 5054, 'loss/train': 1.800482153892517} +11/06/2021 21:57:58 - INFO - __main__ - Step 5056: {'lr': 0.0004994745195587376, 'samples': 970752, 'steps': 5055, 'loss/train': 2.163815975189209} +11/06/2021 21:57:59 - INFO - __main__ - Step 5057: {'lr': 0.0004994741756097164, 'samples': 970944, 'steps': 5056, 'loss/train': 2.414111852645874} +11/06/2021 21:58:00 - INFO - __main__ - Step 5058: {'lr': 0.0004994738315482859, 'samples': 971136, 'steps': 5057, 'loss/train': 1.5080969333648682} +11/06/2021 21:58:00 - INFO - __main__ - Step 5059: {'lr': 0.0004994734873744464, 'samples': 971328, 'steps': 5058, 'loss/train': 2.688166379928589} +11/06/2021 21:58:00 - INFO - __main__ - Step 5060: {'lr': 0.0004994731430881979, 'samples': 971520, 'steps': 5059, 'loss/train': 2.305680990219116} +11/06/2021 21:58:01 - INFO - __main__ - Step 5061: {'lr': 0.0004994727986895408, 'samples': 971712, 'steps': 5060, 'loss/train': 1.9738892316818237} +11/06/2021 21:58:01 - INFO - __main__ - Step 5062: {'lr': 0.0004994724541784749, 'samples': 971904, 'steps': 5061, 'loss/train': 2.3541839122772217} +11/06/2021 21:58:02 - INFO - __main__ - Step 5063: {'lr': 0.0004994721095550008, 'samples': 972096, 'steps': 5062, 'loss/train': 1.869810938835144} +11/06/2021 21:58:02 - INFO - __main__ - Step 5064: {'lr': 0.0004994717648191182, 'samples': 972288, 'steps': 5063, 'loss/train': 1.6675723791122437} +11/06/2021 21:58:03 - INFO - __main__ - Step 5065: {'lr': 0.0004994714199708276, 'samples': 972480, 'steps': 5064, 'loss/train': 0.3723197877407074} +11/06/2021 21:58:03 - INFO - __main__ - Step 5066: {'lr': 0.000499471075010129, 'samples': 972672, 'steps': 5065, 'loss/train': 6.243468761444092} +11/06/2021 21:58:03 - INFO - __main__ - Step 5067: {'lr': 0.0004994707299370226, 'samples': 972864, 'steps': 5066, 'loss/train': 2.330059051513672} +11/06/2021 21:58:04 - INFO - __main__ - Step 5068: {'lr': 0.0004994703847515084, 'samples': 973056, 'steps': 5067, 'loss/train': 1.0603464841842651} +11/06/2021 21:58:05 - INFO - __main__ - Step 5069: {'lr': 0.0004994700394535869, 'samples': 973248, 'steps': 5068, 'loss/train': 2.0306475162506104} +11/06/2021 21:58:05 - INFO - __main__ - Step 5070: {'lr': 0.000499469694043258, 'samples': 973440, 'steps': 5069, 'loss/train': 2.2023260593414307} +11/06/2021 21:58:06 - INFO - __main__ - Step 5071: {'lr': 0.0004994693485205218, 'samples': 973632, 'steps': 5070, 'loss/train': 1.8960644006729126} +11/06/2021 21:58:06 - INFO - __main__ - Step 5072: {'lr': 0.0004994690028853787, 'samples': 973824, 'steps': 5071, 'loss/train': 1.8335449695587158} +11/06/2021 21:58:07 - INFO - __main__ - Step 5073: {'lr': 0.0004994686571378286, 'samples': 974016, 'steps': 5072, 'loss/train': 0.4239940643310547} +11/06/2021 21:58:08 - INFO - __main__ - Step 5074: {'lr': 0.0004994683112778718, 'samples': 974208, 'steps': 5073, 'loss/train': 1.9211030006408691} +11/06/2021 21:58:08 - INFO - __main__ - Step 5075: {'lr': 0.0004994679653055085, 'samples': 974400, 'steps': 5074, 'loss/train': 2.271078109741211} +11/06/2021 21:58:08 - INFO - __main__ - Step 5076: {'lr': 0.0004994676192207387, 'samples': 974592, 'steps': 5075, 'loss/train': 1.9957528114318848} +11/06/2021 21:58:09 - INFO - __main__ - Step 5077: {'lr': 0.0004994672730235626, 'samples': 974784, 'steps': 5076, 'loss/train': 2.396184206008911} +11/06/2021 21:58:09 - INFO - __main__ - Step 5078: {'lr': 0.0004994669267139806, 'samples': 974976, 'steps': 5077, 'loss/train': 2.0437135696411133} +11/06/2021 21:58:10 - INFO - __main__ - Step 5079: {'lr': 0.0004994665802919925, 'samples': 975168, 'steps': 5078, 'loss/train': 2.0462563037872314} +11/06/2021 21:58:11 - INFO - __main__ - Step 5080: {'lr': 0.0004994662337575986, 'samples': 975360, 'steps': 5079, 'loss/train': 2.834306478500366} +11/06/2021 21:58:11 - INFO - __main__ - Step 5081: {'lr': 0.000499465887110799, 'samples': 975552, 'steps': 5080, 'loss/train': 2.6196563243865967} +11/06/2021 21:58:11 - INFO - __main__ - Step 5082: {'lr': 0.0004994655403515941, 'samples': 975744, 'steps': 5081, 'loss/train': 1.8559695482254028} +11/06/2021 21:58:12 - INFO - __main__ - Step 5083: {'lr': 0.0004994651934799837, 'samples': 975936, 'steps': 5082, 'loss/train': 2.3033602237701416} +11/06/2021 21:58:12 - INFO - __main__ - Step 5084: {'lr': 0.0004994648464959683, 'samples': 976128, 'steps': 5083, 'loss/train': 1.8257298469543457} +11/06/2021 21:58:13 - INFO - __main__ - Step 5085: {'lr': 0.0004994644993995478, 'samples': 976320, 'steps': 5084, 'loss/train': 2.538905143737793} +11/06/2021 21:58:13 - INFO - __main__ - Step 5086: {'lr': 0.0004994641521907224, 'samples': 976512, 'steps': 5085, 'loss/train': 2.443490743637085} +11/06/2021 21:58:14 - INFO - __main__ - Step 5087: {'lr': 0.0004994638048694924, 'samples': 976704, 'steps': 5086, 'loss/train': 2.3946332931518555} +11/06/2021 21:58:14 - INFO - __main__ - Step 5088: {'lr': 0.0004994634574358579, 'samples': 976896, 'steps': 5087, 'loss/train': 1.450162649154663} +11/06/2021 21:58:14 - INFO - __main__ - Step 5089: {'lr': 0.0004994631098898188, 'samples': 977088, 'steps': 5088, 'loss/train': 1.5360685586929321} +11/06/2021 21:58:15 - INFO - __main__ - Step 5090: {'lr': 0.0004994627622313757, 'samples': 977280, 'steps': 5089, 'loss/train': 1.8420456647872925} +11/06/2021 21:58:16 - INFO - __main__ - Step 5091: {'lr': 0.0004994624144605284, 'samples': 977472, 'steps': 5090, 'loss/train': 2.4474048614501953} +11/06/2021 21:58:16 - INFO - __main__ - Step 5092: {'lr': 0.0004994620665772772, 'samples': 977664, 'steps': 5091, 'loss/train': 1.8615306615829468} +11/06/2021 21:58:16 - INFO - __main__ - Step 5093: {'lr': 0.0004994617185816222, 'samples': 977856, 'steps': 5092, 'loss/train': 2.000317335128784} +11/06/2021 21:58:17 - INFO - __main__ - Step 5094: {'lr': 0.0004994613704735638, 'samples': 978048, 'steps': 5093, 'loss/train': 2.3359320163726807} +11/06/2021 21:58:18 - INFO - __main__ - Step 5095: {'lr': 0.0004994610222531018, 'samples': 978240, 'steps': 5094, 'loss/train': 2.213413953781128} +11/06/2021 21:58:18 - INFO - __main__ - Step 5096: {'lr': 0.0004994606739202365, 'samples': 978432, 'steps': 5095, 'loss/train': 2.049318552017212} +11/06/2021 21:58:19 - INFO - __main__ - Step 5097: {'lr': 0.0004994603254749681, 'samples': 978624, 'steps': 5096, 'loss/train': 2.276933431625366} +11/06/2021 21:58:19 - INFO - __main__ - Step 5098: {'lr': 0.0004994599769172967, 'samples': 978816, 'steps': 5097, 'loss/train': 2.2054691314697266} +11/06/2021 21:58:19 - INFO - __main__ - Step 5099: {'lr': 0.0004994596282472225, 'samples': 979008, 'steps': 5098, 'loss/train': 1.958910346031189} +11/06/2021 21:58:20 - INFO - __main__ - Step 5100: {'lr': 0.0004994592794647457, 'samples': 979200, 'steps': 5099, 'loss/train': 2.0862319469451904} +11/06/2021 21:58:21 - INFO - __main__ - Step 5101: {'lr': 0.0004994589305698663, 'samples': 979392, 'steps': 5100, 'loss/train': 1.7089622020721436} +11/06/2021 21:58:21 - INFO - __main__ - Step 5102: {'lr': 0.0004994585815625847, 'samples': 979584, 'steps': 5101, 'loss/train': 1.952847957611084} +11/06/2021 21:58:21 - INFO - __main__ - Step 5103: {'lr': 0.0004994582324429008, 'samples': 979776, 'steps': 5102, 'loss/train': 1.894245982170105} +11/06/2021 21:58:22 - INFO - __main__ - Step 5104: {'lr': 0.0004994578832108148, 'samples': 979968, 'steps': 5103, 'loss/train': 1.3645782470703125} +11/06/2021 21:58:22 - INFO - __main__ - Step 5105: {'lr': 0.000499457533866327, 'samples': 980160, 'steps': 5104, 'loss/train': 2.4554972648620605} +11/06/2021 21:58:23 - INFO - __main__ - Step 5106: {'lr': 0.0004994571844094375, 'samples': 980352, 'steps': 5105, 'loss/train': 2.340075731277466} +11/06/2021 21:58:23 - INFO - __main__ - Step 5107: {'lr': 0.0004994568348401466, 'samples': 980544, 'steps': 5106, 'loss/train': 1.1222628355026245} +11/06/2021 21:58:24 - INFO - __main__ - Step 5108: {'lr': 0.0004994564851584541, 'samples': 980736, 'steps': 5107, 'loss/train': 1.5331889390945435} +11/06/2021 21:58:24 - INFO - __main__ - Step 5109: {'lr': 0.0004994561353643604, 'samples': 980928, 'steps': 5108, 'loss/train': 1.8134424686431885} +11/06/2021 21:58:25 - INFO - __main__ - Step 5110: {'lr': 0.0004994557854578656, 'samples': 981120, 'steps': 5109, 'loss/train': 1.9003137350082397} +11/06/2021 21:58:26 - INFO - __main__ - Step 5111: {'lr': 0.0004994554354389699, 'samples': 981312, 'steps': 5110, 'loss/train': 1.9330469369888306} +11/06/2021 21:58:26 - INFO - __main__ - Step 5112: {'lr': 0.0004994550853076734, 'samples': 981504, 'steps': 5111, 'loss/train': 1.9353581666946411} +11/06/2021 21:58:27 - INFO - __main__ - Step 5113: {'lr': 0.0004994547350639764, 'samples': 981696, 'steps': 5112, 'loss/train': 2.078845500946045} +11/06/2021 21:58:27 - INFO - __main__ - Step 5114: {'lr': 0.0004994543847078787, 'samples': 981888, 'steps': 5113, 'loss/train': 1.3129998445510864} +11/06/2021 21:58:27 - INFO - __main__ - Step 5115: {'lr': 0.000499454034239381, 'samples': 982080, 'steps': 5114, 'loss/train': 1.7932987213134766} +11/06/2021 21:58:28 - INFO - __main__ - Step 5116: {'lr': 0.000499453683658483, 'samples': 982272, 'steps': 5115, 'loss/train': 2.2063400745391846} +11/06/2021 21:58:28 - INFO - __main__ - Step 5117: {'lr': 0.0004994533329651849, 'samples': 982464, 'steps': 5116, 'loss/train': 1.820799469947815} +11/06/2021 21:58:29 - INFO - __main__ - Step 5118: {'lr': 0.0004994529821594872, 'samples': 982656, 'steps': 5117, 'loss/train': 2.5855801105499268} +11/06/2021 21:58:29 - INFO - __main__ - Step 5119: {'lr': 0.0004994526312413897, 'samples': 982848, 'steps': 5118, 'loss/train': 1.6690380573272705} +11/06/2021 21:58:30 - INFO - __main__ - Step 5120: {'lr': 0.0004994522802108927, 'samples': 983040, 'steps': 5119, 'loss/train': 1.896449327468872} +11/06/2021 21:58:30 - INFO - __main__ - Step 5121: {'lr': 0.0004994519290679964, 'samples': 983232, 'steps': 5120, 'loss/train': 1.6968704462051392} +11/06/2021 21:58:31 - INFO - __main__ - Step 5122: {'lr': 0.0004994515778127009, 'samples': 983424, 'steps': 5121, 'loss/train': 1.7569773197174072} +11/06/2021 21:58:31 - INFO - __main__ - Step 5123: {'lr': 0.0004994512264450064, 'samples': 983616, 'steps': 5122, 'loss/train': 2.063852310180664} +11/06/2021 21:58:32 - INFO - __main__ - Step 5124: {'lr': 0.000499450874964913, 'samples': 983808, 'steps': 5123, 'loss/train': 2.1291959285736084} +11/06/2021 21:58:32 - INFO - __main__ - Step 5125: {'lr': 0.000499450523372421, 'samples': 984000, 'steps': 5124, 'loss/train': 2.469874143600464} +11/06/2021 21:58:32 - INFO - __main__ - Step 5126: {'lr': 0.0004994501716675303, 'samples': 984192, 'steps': 5125, 'loss/train': 1.7951209545135498} +11/06/2021 21:58:33 - INFO - __main__ - Step 5127: {'lr': 0.0004994498198502412, 'samples': 984384, 'steps': 5126, 'loss/train': 2.0104482173919678} +11/06/2021 21:58:34 - INFO - __main__ - Step 5128: {'lr': 0.0004994494679205539, 'samples': 984576, 'steps': 5127, 'loss/train': 2.0760858058929443} +11/06/2021 21:58:34 - INFO - __main__ - Step 5129: {'lr': 0.0004994491158784684, 'samples': 984768, 'steps': 5128, 'loss/train': 2.1686079502105713} +11/06/2021 21:58:34 - INFO - __main__ - Step 5130: {'lr': 0.0004994487637239851, 'samples': 984960, 'steps': 5129, 'loss/train': 1.1807832717895508} +11/06/2021 21:58:35 - INFO - __main__ - Step 5131: {'lr': 0.0004994484114571041, 'samples': 985152, 'steps': 5130, 'loss/train': 1.4355896711349487} +11/06/2021 21:58:36 - INFO - __main__ - Step 5132: {'lr': 0.0004994480590778254, 'samples': 985344, 'steps': 5131, 'loss/train': 1.8569763898849487} +11/06/2021 21:58:36 - INFO - __main__ - Step 5133: {'lr': 0.0004994477065861493, 'samples': 985536, 'steps': 5132, 'loss/train': 2.1365954875946045} +11/06/2021 21:58:37 - INFO - __main__ - Step 5134: {'lr': 0.0004994473539820758, 'samples': 985728, 'steps': 5133, 'loss/train': 1.7661622762680054} +11/06/2021 21:58:37 - INFO - __main__ - Step 5135: {'lr': 0.0004994470012656052, 'samples': 985920, 'steps': 5134, 'loss/train': 2.2697160243988037} +11/06/2021 21:58:37 - INFO - __main__ - Step 5136: {'lr': 0.0004994466484367378, 'samples': 986112, 'steps': 5135, 'loss/train': 2.3424150943756104} +11/06/2021 21:58:38 - INFO - __main__ - Step 5137: {'lr': 0.0004994462954954734, 'samples': 986304, 'steps': 5136, 'loss/train': 1.250626564025879} +11/06/2021 21:58:39 - INFO - __main__ - Step 5138: {'lr': 0.0004994459424418125, 'samples': 986496, 'steps': 5137, 'loss/train': 2.22953462600708} +11/06/2021 21:58:39 - INFO - __main__ - Step 5139: {'lr': 0.000499445589275755, 'samples': 986688, 'steps': 5138, 'loss/train': 2.005419969558716} +11/06/2021 21:58:39 - INFO - __main__ - Step 5140: {'lr': 0.0004994452359973012, 'samples': 986880, 'steps': 5139, 'loss/train': 1.6053614616394043} +11/06/2021 21:58:40 - INFO - __main__ - Step 5141: {'lr': 0.0004994448826064512, 'samples': 987072, 'steps': 5140, 'loss/train': 2.132984161376953} +11/06/2021 21:58:41 - INFO - __main__ - Step 5142: {'lr': 0.0004994445291032053, 'samples': 987264, 'steps': 5141, 'loss/train': 1.4963831901550293} +11/06/2021 21:58:41 - INFO - __main__ - Step 5143: {'lr': 0.0004994441754875634, 'samples': 987456, 'steps': 5142, 'loss/train': 2.0756425857543945} +11/06/2021 21:58:41 - INFO - __main__ - Step 5144: {'lr': 0.0004994438217595259, 'samples': 987648, 'steps': 5143, 'loss/train': 2.1674396991729736} +11/06/2021 21:58:42 - INFO - __main__ - Step 5145: {'lr': 0.0004994434679190928, 'samples': 987840, 'steps': 5144, 'loss/train': 2.1360890865325928} +11/06/2021 21:58:42 - INFO - __main__ - Step 5146: {'lr': 0.0004994431139662643, 'samples': 988032, 'steps': 5145, 'loss/train': 2.855836868286133} +11/06/2021 21:58:43 - INFO - __main__ - Step 5147: {'lr': 0.0004994427599010406, 'samples': 988224, 'steps': 5146, 'loss/train': 2.0516815185546875} +11/06/2021 21:58:44 - INFO - __main__ - Step 5148: {'lr': 0.0004994424057234219, 'samples': 988416, 'steps': 5147, 'loss/train': 1.951188087463379} +11/06/2021 21:58:45 - INFO - __main__ - Step 5149: {'lr': 0.0004994420514334082, 'samples': 988608, 'steps': 5148, 'loss/train': 1.9776523113250732} +11/06/2021 21:58:45 - INFO - __main__ - Step 5150: {'lr': 0.0004994416970309999, 'samples': 988800, 'steps': 5149, 'loss/train': 2.2853457927703857} +11/06/2021 21:58:45 - INFO - __main__ - Step 5151: {'lr': 0.0004994413425161969, 'samples': 988992, 'steps': 5150, 'loss/train': 1.2515465021133423} +11/06/2021 21:58:46 - INFO - __main__ - Step 5152: {'lr': 0.0004994409878889995, 'samples': 989184, 'steps': 5151, 'loss/train': 1.107923984527588} +11/06/2021 21:58:46 - INFO - __main__ - Step 5153: {'lr': 0.0004994406331494079, 'samples': 989376, 'steps': 5152, 'loss/train': 0.8732290267944336} +11/06/2021 21:58:47 - INFO - __main__ - Step 5154: {'lr': 0.0004994402782974222, 'samples': 989568, 'steps': 5153, 'loss/train': 1.9641544818878174} +11/06/2021 21:58:47 - INFO - __main__ - Step 5155: {'lr': 0.0004994399233330426, 'samples': 989760, 'steps': 5154, 'loss/train': 2.2096810340881348} +11/06/2021 21:58:48 - INFO - __main__ - Step 5156: {'lr': 0.000499439568256269, 'samples': 989952, 'steps': 5155, 'loss/train': 1.8779668807983398} +11/06/2021 21:58:48 - INFO - __main__ - Step 5157: {'lr': 0.000499439213067102, 'samples': 990144, 'steps': 5156, 'loss/train': 2.0117697715759277} +11/06/2021 21:58:48 - INFO - __main__ - Step 5158: {'lr': 0.0004994388577655415, 'samples': 990336, 'steps': 5157, 'loss/train': 1.9738129377365112} +11/06/2021 21:58:49 - INFO - __main__ - Step 5159: {'lr': 0.0004994385023515876, 'samples': 990528, 'steps': 5158, 'loss/train': 2.6475677490234375} +11/06/2021 21:58:50 - INFO - __main__ - Step 5160: {'lr': 0.0004994381468252406, 'samples': 990720, 'steps': 5159, 'loss/train': 2.463541269302368} +11/06/2021 21:58:50 - INFO - __main__ - Step 5161: {'lr': 0.0004994377911865007, 'samples': 990912, 'steps': 5160, 'loss/train': 2.4826114177703857} +11/06/2021 21:58:51 - INFO - __main__ - Step 5162: {'lr': 0.0004994374354353679, 'samples': 991104, 'steps': 5161, 'loss/train': 2.0047404766082764} +11/06/2021 21:58:51 - INFO - __main__ - Step 5163: {'lr': 0.0004994370795718425, 'samples': 991296, 'steps': 5162, 'loss/train': 2.0610859394073486} +11/06/2021 21:58:51 - INFO - __main__ - Step 5164: {'lr': 0.0004994367235959245, 'samples': 991488, 'steps': 5163, 'loss/train': 1.4020670652389526} +11/06/2021 21:58:52 - INFO - __main__ - Step 5165: {'lr': 0.0004994363675076143, 'samples': 991680, 'steps': 5164, 'loss/train': 1.8617390394210815} +11/06/2021 21:58:53 - INFO - __main__ - Step 5166: {'lr': 0.0004994360113069118, 'samples': 991872, 'steps': 5165, 'loss/train': 2.2617647647857666} +11/06/2021 21:58:53 - INFO - __main__ - Step 5167: {'lr': 0.0004994356549938173, 'samples': 992064, 'steps': 5166, 'loss/train': 2.5071494579315186} +11/06/2021 21:58:53 - INFO - __main__ - Step 5168: {'lr': 0.000499435298568331, 'samples': 992256, 'steps': 5167, 'loss/train': 2.4085593223571777} +11/06/2021 21:58:54 - INFO - __main__ - Step 5169: {'lr': 0.000499434942030453, 'samples': 992448, 'steps': 5168, 'loss/train': 1.7436469793319702} +11/06/2021 21:58:55 - INFO - __main__ - Step 5170: {'lr': 0.0004994345853801834, 'samples': 992640, 'steps': 5169, 'loss/train': 1.887163758277893} +11/06/2021 21:58:55 - INFO - __main__ - Step 5171: {'lr': 0.0004994342286175225, 'samples': 992832, 'steps': 5170, 'loss/train': 1.4238390922546387} +11/06/2021 21:58:56 - INFO - __main__ - Step 5172: {'lr': 0.0004994338717424704, 'samples': 993024, 'steps': 5171, 'loss/train': 1.6073421239852905} +11/06/2021 21:58:56 - INFO - __main__ - Step 5173: {'lr': 0.0004994335147550272, 'samples': 993216, 'steps': 5172, 'loss/train': 2.328388214111328} +11/06/2021 21:58:56 - INFO - __main__ - Step 5174: {'lr': 0.0004994331576551931, 'samples': 993408, 'steps': 5173, 'loss/train': 2.2518372535705566} +11/06/2021 21:58:57 - INFO - __main__ - Step 5175: {'lr': 0.0004994328004429683, 'samples': 993600, 'steps': 5174, 'loss/train': 1.5607566833496094} +11/06/2021 21:58:58 - INFO - __main__ - Step 5176: {'lr': 0.000499432443118353, 'samples': 993792, 'steps': 5175, 'loss/train': 2.3936564922332764} +11/06/2021 21:58:58 - INFO - __main__ - Step 5177: {'lr': 0.0004994320856813471, 'samples': 993984, 'steps': 5176, 'loss/train': 1.8367432355880737} +11/06/2021 21:58:58 - INFO - __main__ - Step 5178: {'lr': 0.000499431728131951, 'samples': 994176, 'steps': 5177, 'loss/train': 1.9661235809326172} +11/06/2021 21:58:59 - INFO - __main__ - Step 5179: {'lr': 0.0004994313704701648, 'samples': 994368, 'steps': 5178, 'loss/train': 2.193740129470825} +11/06/2021 21:59:00 - INFO - __main__ - Step 5180: {'lr': 0.0004994310126959887, 'samples': 994560, 'steps': 5179, 'loss/train': 1.998255968093872} +11/06/2021 21:59:00 - INFO - __main__ - Step 5181: {'lr': 0.000499430654809423, 'samples': 994752, 'steps': 5180, 'loss/train': 2.1848907470703125} +11/06/2021 21:59:00 - INFO - __main__ - Step 5182: {'lr': 0.0004994302968104675, 'samples': 994944, 'steps': 5181, 'loss/train': 2.1371874809265137} +11/06/2021 21:59:01 - INFO - __main__ - Step 5183: {'lr': 0.0004994299386991227, 'samples': 995136, 'steps': 5182, 'loss/train': 2.302549362182617} +11/06/2021 21:59:01 - INFO - __main__ - Step 5184: {'lr': 0.0004994295804753885, 'samples': 995328, 'steps': 5183, 'loss/train': 1.9894294738769531} +11/06/2021 21:59:02 - INFO - __main__ - Step 5185: {'lr': 0.0004994292221392652, 'samples': 995520, 'steps': 5184, 'loss/train': 2.0415422916412354} +11/06/2021 21:59:02 - INFO - __main__ - Step 5186: {'lr': 0.000499428863690753, 'samples': 995712, 'steps': 5185, 'loss/train': 2.606383800506592} +11/06/2021 21:59:03 - INFO - __main__ - Step 5187: {'lr': 0.0004994285051298519, 'samples': 995904, 'steps': 5186, 'loss/train': 2.254190444946289} +11/06/2021 21:59:03 - INFO - __main__ - Step 5188: {'lr': 0.0004994281464565623, 'samples': 996096, 'steps': 5187, 'loss/train': 1.9112964868545532} +11/06/2021 21:59:03 - INFO - __main__ - Step 5189: {'lr': 0.0004994277876708841, 'samples': 996288, 'steps': 5188, 'loss/train': 1.7943540811538696} +11/06/2021 21:59:05 - INFO - __main__ - Step 5190: {'lr': 0.0004994274287728177, 'samples': 996480, 'steps': 5189, 'loss/train': 2.0679004192352295} +11/06/2021 21:59:05 - INFO - __main__ - Step 5191: {'lr': 0.0004994270697623631, 'samples': 996672, 'steps': 5190, 'loss/train': 1.3824659585952759} +11/06/2021 21:59:06 - INFO - __main__ - Step 5192: {'lr': 0.0004994267106395205, 'samples': 996864, 'steps': 5191, 'loss/train': 1.7324517965316772} +11/06/2021 21:59:06 - INFO - __main__ - Step 5193: {'lr': 0.0004994263514042901, 'samples': 997056, 'steps': 5192, 'loss/train': 0.9526032209396362} +11/06/2021 21:59:06 - INFO - __main__ - Step 5194: {'lr': 0.0004994259920566719, 'samples': 997248, 'steps': 5193, 'loss/train': 0.5770443677902222} +11/06/2021 21:59:07 - INFO - __main__ - Step 5195: {'lr': 0.0004994256325966663, 'samples': 997440, 'steps': 5194, 'loss/train': 1.4841455221176147} +11/06/2021 21:59:08 - INFO - __main__ - Step 5196: {'lr': 0.0004994252730242734, 'samples': 997632, 'steps': 5195, 'loss/train': 2.2125959396362305} +11/06/2021 21:59:08 - INFO - __main__ - Step 5197: {'lr': 0.0004994249133394933, 'samples': 997824, 'steps': 5196, 'loss/train': 1.9928648471832275} +11/06/2021 21:59:08 - INFO - __main__ - Step 5198: {'lr': 0.0004994245535423262, 'samples': 998016, 'steps': 5197, 'loss/train': 2.454911947250366} +11/06/2021 21:59:09 - INFO - __main__ - Step 5199: {'lr': 0.0004994241936327722, 'samples': 998208, 'steps': 5198, 'loss/train': 1.8284403085708618} +11/06/2021 21:59:10 - INFO - __main__ - Step 5200: {'lr': 0.0004994238336108315, 'samples': 998400, 'steps': 5199, 'loss/train': 1.941856861114502} +11/06/2021 21:59:10 - INFO - __main__ - Step 5201: {'lr': 0.0004994234734765043, 'samples': 998592, 'steps': 5200, 'loss/train': 1.9864927530288696} +11/06/2021 21:59:10 - INFO - __main__ - Step 5202: {'lr': 0.0004994231132297907, 'samples': 998784, 'steps': 5201, 'loss/train': 1.9978981018066406} +11/06/2021 21:59:11 - INFO - __main__ - Step 5203: {'lr': 0.0004994227528706909, 'samples': 998976, 'steps': 5202, 'loss/train': 0.5917396545410156} +11/06/2021 21:59:11 - INFO - __main__ - Step 5204: {'lr': 0.0004994223923992052, 'samples': 999168, 'steps': 5203, 'loss/train': 1.8816064596176147} +11/06/2021 21:59:12 - INFO - __main__ - Step 5205: {'lr': 0.0004994220318153334, 'samples': 999360, 'steps': 5204, 'loss/train': 1.95060133934021} +11/06/2021 21:59:13 - INFO - __main__ - Step 5206: {'lr': 0.000499421671119076, 'samples': 999552, 'steps': 5205, 'loss/train': 2.2630045413970947} +11/06/2021 21:59:13 - INFO - __main__ - Step 5207: {'lr': 0.0004994213103104331, 'samples': 999744, 'steps': 5206, 'loss/train': 1.9655598402023315} +11/06/2021 21:59:13 - INFO - __main__ - Step 5208: {'lr': 0.0004994209493894046, 'samples': 999936, 'steps': 5207, 'loss/train': 2.0341320037841797} +11/06/2021 21:59:14 - INFO - __main__ - Step 5209: {'lr': 0.000499420588355991, 'samples': 1000128, 'steps': 5208, 'loss/train': 2.1907718181610107} +11/06/2021 21:59:14 - INFO - __main__ - Step 5210: {'lr': 0.0004994202272101923, 'samples': 1000320, 'steps': 5209, 'loss/train': 2.0395348072052} +11/06/2021 21:59:15 - INFO - __main__ - Step 5211: {'lr': 0.0004994198659520087, 'samples': 1000512, 'steps': 5210, 'loss/train': 1.4296295642852783} +11/06/2021 21:59:15 - INFO - __main__ - Step 5212: {'lr': 0.0004994195045814404, 'samples': 1000704, 'steps': 5211, 'loss/train': 1.9126372337341309} +11/06/2021 21:59:16 - INFO - __main__ - Step 5213: {'lr': 0.0004994191430984876, 'samples': 1000896, 'steps': 5212, 'loss/train': 1.5323981046676636} +11/06/2021 21:59:16 - INFO - __main__ - Step 5214: {'lr': 0.0004994187815031502, 'samples': 1001088, 'steps': 5213, 'loss/train': 2.079664468765259} +11/06/2021 21:59:16 - INFO - __main__ - Step 5215: {'lr': 0.0004994184197954286, 'samples': 1001280, 'steps': 5214, 'loss/train': 2.4426677227020264} +11/06/2021 21:59:18 - INFO - __main__ - Step 5216: {'lr': 0.000499418057975323, 'samples': 1001472, 'steps': 5215, 'loss/train': 1.766026258468628} +11/06/2021 21:59:18 - INFO - __main__ - Step 5217: {'lr': 0.0004994176960428333, 'samples': 1001664, 'steps': 5216, 'loss/train': 2.4069254398345947} +11/06/2021 21:59:18 - INFO - __main__ - Step 5218: {'lr': 0.00049941733399796, 'samples': 1001856, 'steps': 5217, 'loss/train': 2.27449369430542} +11/06/2021 21:59:19 - INFO - __main__ - Step 5219: {'lr': 0.000499416971840703, 'samples': 1002048, 'steps': 5218, 'loss/train': 1.5242971181869507} +11/06/2021 21:59:19 - INFO - __main__ - Step 5220: {'lr': 0.0004994166095710626, 'samples': 1002240, 'steps': 5219, 'loss/train': 1.8974841833114624} +11/06/2021 21:59:20 - INFO - __main__ - Step 5221: {'lr': 0.000499416247189039, 'samples': 1002432, 'steps': 5220, 'loss/train': 1.832592248916626} +11/06/2021 21:59:21 - INFO - __main__ - Step 5222: {'lr': 0.0004994158846946321, 'samples': 1002624, 'steps': 5221, 'loss/train': 1.9344158172607422} +11/06/2021 21:59:21 - INFO - __main__ - Step 5223: {'lr': 0.0004994155220878425, 'samples': 1002816, 'steps': 5222, 'loss/train': 1.6130883693695068} +11/06/2021 21:59:21 - INFO - __main__ - Step 5224: {'lr': 0.0004994151593686699, 'samples': 1003008, 'steps': 5223, 'loss/train': 0.5793285965919495} +11/06/2021 21:59:22 - INFO - __main__ - Step 5225: {'lr': 0.0004994147965371147, 'samples': 1003200, 'steps': 5224, 'loss/train': 2.1755013465881348} +11/06/2021 21:59:23 - INFO - __main__ - Step 5226: {'lr': 0.0004994144335931772, 'samples': 1003392, 'steps': 5225, 'loss/train': 1.7877094745635986} +11/06/2021 21:59:23 - INFO - __main__ - Step 5227: {'lr': 0.0004994140705368573, 'samples': 1003584, 'steps': 5226, 'loss/train': 2.2187447547912598} +11/06/2021 21:59:24 - INFO - __main__ - Step 5228: {'lr': 0.0004994137073681552, 'samples': 1003776, 'steps': 5227, 'loss/train': 1.6575233936309814} +11/06/2021 21:59:24 - INFO - __main__ - Step 5229: {'lr': 0.0004994133440870712, 'samples': 1003968, 'steps': 5228, 'loss/train': 2.3762245178222656} +11/06/2021 21:59:24 - INFO - __main__ - Step 5230: {'lr': 0.0004994129806936054, 'samples': 1004160, 'steps': 5229, 'loss/train': 2.717776298522949} +11/06/2021 21:59:25 - INFO - __main__ - Step 5231: {'lr': 0.000499412617187758, 'samples': 1004352, 'steps': 5230, 'loss/train': 1.9042540788650513} +11/06/2021 21:59:26 - INFO - __main__ - Step 5232: {'lr': 0.0004994122535695291, 'samples': 1004544, 'steps': 5231, 'loss/train': 2.3282763957977295} +11/06/2021 21:59:26 - INFO - __main__ - Step 5233: {'lr': 0.0004994118898389189, 'samples': 1004736, 'steps': 5232, 'loss/train': 1.996087670326233} +11/06/2021 21:59:26 - INFO - __main__ - Step 5234: {'lr': 0.0004994115259959274, 'samples': 1004928, 'steps': 5233, 'loss/train': 1.9831849336624146} +11/06/2021 21:59:27 - INFO - __main__ - Step 5235: {'lr': 0.0004994111620405551, 'samples': 1005120, 'steps': 5234, 'loss/train': 1.956398844718933} +11/06/2021 21:59:28 - INFO - __main__ - Step 5236: {'lr': 0.0004994107979728019, 'samples': 1005312, 'steps': 5235, 'loss/train': 1.0656429529190063} +11/06/2021 21:59:28 - INFO - __main__ - Step 5237: {'lr': 0.0004994104337926681, 'samples': 1005504, 'steps': 5236, 'loss/train': 2.004157066345215} +11/06/2021 21:59:28 - INFO - __main__ - Step 5238: {'lr': 0.0004994100695001537, 'samples': 1005696, 'steps': 5237, 'loss/train': 1.8911778926849365} +11/06/2021 21:59:29 - INFO - __main__ - Step 5239: {'lr': 0.0004994097050952591, 'samples': 1005888, 'steps': 5238, 'loss/train': 2.1261074542999268} +11/06/2021 21:59:29 - INFO - __main__ - Step 5240: {'lr': 0.0004994093405779842, 'samples': 1006080, 'steps': 5239, 'loss/train': 1.9837573766708374} +11/06/2021 21:59:29 - INFO - __main__ - Step 5241: {'lr': 0.0004994089759483294, 'samples': 1006272, 'steps': 5240, 'loss/train': 1.9001221656799316} +11/06/2021 21:59:31 - INFO - __main__ - Step 5242: {'lr': 0.0004994086112062948, 'samples': 1006464, 'steps': 5241, 'loss/train': 1.5564855337142944} +11/06/2021 21:59:31 - INFO - __main__ - Step 5243: {'lr': 0.0004994082463518804, 'samples': 1006656, 'steps': 5242, 'loss/train': 1.7091917991638184} +11/06/2021 21:59:31 - INFO - __main__ - Step 5244: {'lr': 0.0004994078813850865, 'samples': 1006848, 'steps': 5243, 'loss/train': 2.3507444858551025} +11/06/2021 21:59:32 - INFO - __main__ - Step 5245: {'lr': 0.0004994075163059134, 'samples': 1007040, 'steps': 5244, 'loss/train': 1.456217646598816} +11/06/2021 21:59:32 - INFO - __main__ - Step 5246: {'lr': 0.0004994071511143609, 'samples': 1007232, 'steps': 5245, 'loss/train': 2.2415311336517334} +11/06/2021 21:59:33 - INFO - __main__ - Step 5247: {'lr': 0.0004994067858104296, 'samples': 1007424, 'steps': 5246, 'loss/train': 1.7924270629882812} +11/06/2021 21:59:33 - INFO - __main__ - Step 5248: {'lr': 0.0004994064203941195, 'samples': 1007616, 'steps': 5247, 'loss/train': 1.7448370456695557} +11/06/2021 21:59:34 - INFO - __main__ - Step 5249: {'lr': 0.0004994060548654304, 'samples': 1007808, 'steps': 5248, 'loss/train': 2.0024914741516113} +11/06/2021 21:59:34 - INFO - __main__ - Step 5250: {'lr': 0.000499405689224363, 'samples': 1008000, 'steps': 5249, 'loss/train': 2.1484951972961426} +11/06/2021 21:59:35 - INFO - __main__ - Step 5251: {'lr': 0.0004994053234709172, 'samples': 1008192, 'steps': 5250, 'loss/train': 2.0290279388427734} +11/06/2021 21:59:35 - INFO - __main__ - Step 5252: {'lr': 0.0004994049576050933, 'samples': 1008384, 'steps': 5251, 'loss/train': 1.8063730001449585} +11/06/2021 21:59:36 - INFO - __main__ - Step 5253: {'lr': 0.0004994045916268913, 'samples': 1008576, 'steps': 5252, 'loss/train': 1.8525824546813965} +11/06/2021 21:59:36 - INFO - __main__ - Step 5254: {'lr': 0.0004994042255363115, 'samples': 1008768, 'steps': 5253, 'loss/train': 1.7812204360961914} +11/06/2021 21:59:37 - INFO - __main__ - Step 5255: {'lr': 0.0004994038593333539, 'samples': 1008960, 'steps': 5254, 'loss/train': 1.8962163925170898} +11/06/2021 21:59:37 - INFO - __main__ - Step 5256: {'lr': 0.0004994034930180188, 'samples': 1009152, 'steps': 5255, 'loss/train': 1.78254234790802} +11/06/2021 21:59:38 - INFO - __main__ - Step 5257: {'lr': 0.0004994031265903063, 'samples': 1009344, 'steps': 5256, 'loss/train': 2.477855920791626} +11/06/2021 21:59:38 - INFO - __main__ - Step 5258: {'lr': 0.0004994027600502167, 'samples': 1009536, 'steps': 5257, 'loss/train': 1.9207967519760132} +11/06/2021 21:59:39 - INFO - __main__ - Step 5259: {'lr': 0.00049940239339775, 'samples': 1009728, 'steps': 5258, 'loss/train': 1.7611019611358643} +11/06/2021 21:59:39 - INFO - __main__ - Step 5260: {'lr': 0.0004994020266329064, 'samples': 1009920, 'steps': 5259, 'loss/train': 1.293487548828125} +11/06/2021 21:59:39 - INFO - __main__ - Step 5261: {'lr': 0.0004994016597556862, 'samples': 1010112, 'steps': 5260, 'loss/train': 2.4520223140716553} +11/06/2021 21:59:40 - INFO - __main__ - Step 5262: {'lr': 0.0004994012927660894, 'samples': 1010304, 'steps': 5261, 'loss/train': 2.1690826416015625} +11/06/2021 21:59:41 - INFO - __main__ - Step 5263: {'lr': 0.0004994009256641162, 'samples': 1010496, 'steps': 5262, 'loss/train': 1.7376418113708496} +11/06/2021 21:59:41 - INFO - __main__ - Step 5264: {'lr': 0.0004994005584497667, 'samples': 1010688, 'steps': 5263, 'loss/train': 1.8751423358917236} +11/06/2021 21:59:41 - INFO - __main__ - Step 5265: {'lr': 0.0004994001911230413, 'samples': 1010880, 'steps': 5264, 'loss/train': 1.917157769203186} +11/06/2021 21:59:42 - INFO - __main__ - Step 5266: {'lr': 0.00049939982368394, 'samples': 1011072, 'steps': 5265, 'loss/train': 1.825718879699707} +11/06/2021 21:59:42 - INFO - __main__ - Step 5267: {'lr': 0.000499399456132463, 'samples': 1011264, 'steps': 5266, 'loss/train': 2.2549986839294434} +11/06/2021 21:59:44 - INFO - __main__ - Step 5268: {'lr': 0.0004993990884686105, 'samples': 1011456, 'steps': 5267, 'loss/train': 1.5457383394241333} +11/06/2021 21:59:44 - INFO - __main__ - Step 5269: {'lr': 0.0004993987206923825, 'samples': 1011648, 'steps': 5268, 'loss/train': 1.0259302854537964} +11/06/2021 21:59:44 - INFO - __main__ - Step 5270: {'lr': 0.0004993983528037793, 'samples': 1011840, 'steps': 5269, 'loss/train': 1.1901259422302246} +11/06/2021 21:59:45 - INFO - __main__ - Step 5271: {'lr': 0.0004993979848028011, 'samples': 1012032, 'steps': 5270, 'loss/train': 2.2096664905548096} +11/06/2021 21:59:45 - INFO - __main__ - Step 5272: {'lr': 0.000499397616689448, 'samples': 1012224, 'steps': 5271, 'loss/train': 1.2520197629928589} +11/06/2021 21:59:46 - INFO - __main__ - Step 5273: {'lr': 0.0004993972484637202, 'samples': 1012416, 'steps': 5272, 'loss/train': 1.571405053138733} +11/06/2021 21:59:47 - INFO - __main__ - Step 5274: {'lr': 0.0004993968801256178, 'samples': 1012608, 'steps': 5273, 'loss/train': 2.2659175395965576} +11/06/2021 21:59:47 - INFO - __main__ - Step 5275: {'lr': 0.0004993965116751411, 'samples': 1012800, 'steps': 5274, 'loss/train': 1.6691346168518066} +11/06/2021 21:59:47 - INFO - __main__ - Step 5276: {'lr': 0.0004993961431122901, 'samples': 1012992, 'steps': 5275, 'loss/train': 2.171734094619751} +11/06/2021 21:59:48 - INFO - __main__ - Step 5277: {'lr': 0.0004993957744370651, 'samples': 1013184, 'steps': 5276, 'loss/train': 2.206928253173828} +11/06/2021 21:59:49 - INFO - __main__ - Step 5278: {'lr': 0.0004993954056494662, 'samples': 1013376, 'steps': 5277, 'loss/train': 1.2756541967391968} +11/06/2021 21:59:49 - INFO - __main__ - Step 5279: {'lr': 0.0004993950367494936, 'samples': 1013568, 'steps': 5278, 'loss/train': 2.2866268157958984} +11/06/2021 21:59:49 - INFO - __main__ - Step 5280: {'lr': 0.0004993946677371474, 'samples': 1013760, 'steps': 5279, 'loss/train': 2.0941381454467773} +11/06/2021 21:59:50 - INFO - __main__ - Step 5281: {'lr': 0.0004993942986124278, 'samples': 1013952, 'steps': 5280, 'loss/train': 1.8966882228851318} +11/06/2021 21:59:50 - INFO - __main__ - Step 5282: {'lr': 0.000499393929375335, 'samples': 1014144, 'steps': 5281, 'loss/train': 1.9149951934814453} +11/06/2021 21:59:51 - INFO - __main__ - Step 5283: {'lr': 0.0004993935600258691, 'samples': 1014336, 'steps': 5282, 'loss/train': 2.0702826976776123} +11/06/2021 21:59:51 - INFO - __main__ - Step 5284: {'lr': 0.0004993931905640305, 'samples': 1014528, 'steps': 5283, 'loss/train': 2.0960628986358643} +11/06/2021 21:59:52 - INFO - __main__ - Step 5285: {'lr': 0.000499392820989819, 'samples': 1014720, 'steps': 5284, 'loss/train': 1.8415803909301758} +11/06/2021 21:59:52 - INFO - __main__ - Step 5286: {'lr': 0.0004993924513032349, 'samples': 1014912, 'steps': 5285, 'loss/train': 2.124772071838379} +11/06/2021 21:59:52 - INFO - __main__ - Step 5287: {'lr': 0.0004993920815042785, 'samples': 1015104, 'steps': 5286, 'loss/train': 1.629605770111084} +11/06/2021 21:59:53 - INFO - __main__ - Step 5288: {'lr': 0.0004993917115929498, 'samples': 1015296, 'steps': 5287, 'loss/train': 2.094998359680176} +11/06/2021 21:59:54 - INFO - __main__ - Step 5289: {'lr': 0.0004993913415692492, 'samples': 1015488, 'steps': 5288, 'loss/train': 0.9913315176963806} +11/06/2021 21:59:54 - INFO - __main__ - Step 5290: {'lr': 0.0004993909714331766, 'samples': 1015680, 'steps': 5289, 'loss/train': 2.3629143238067627} +11/06/2021 21:59:54 - INFO - __main__ - Step 5291: {'lr': 0.0004993906011847323, 'samples': 1015872, 'steps': 5290, 'loss/train': 1.4902851581573486} +11/06/2021 21:59:55 - INFO - __main__ - Step 5292: {'lr': 0.0004993902308239164, 'samples': 1016064, 'steps': 5291, 'loss/train': 2.1800575256347656} +11/06/2021 21:59:55 - INFO - __main__ - Step 5293: {'lr': 0.0004993898603507292, 'samples': 1016256, 'steps': 5292, 'loss/train': 1.8672491312026978} +11/06/2021 21:59:56 - INFO - __main__ - Step 5294: {'lr': 0.0004993894897651706, 'samples': 1016448, 'steps': 5293, 'loss/train': 1.4217222929000854} +11/06/2021 21:59:57 - INFO - __main__ - Step 5295: {'lr': 0.0004993891190672411, 'samples': 1016640, 'steps': 5294, 'loss/train': 2.300929307937622} +11/06/2021 21:59:57 - INFO - __main__ - Step 5296: {'lr': 0.0004993887482569407, 'samples': 1016832, 'steps': 5295, 'loss/train': 1.8544442653656006} +11/06/2021 21:59:57 - INFO - __main__ - Step 5297: {'lr': 0.0004993883773342695, 'samples': 1017024, 'steps': 5296, 'loss/train': 1.9744642972946167} +11/06/2021 21:59:58 - INFO - __main__ - Step 5298: {'lr': 0.0004993880062992279, 'samples': 1017216, 'steps': 5297, 'loss/train': 1.6615900993347168} +11/06/2021 21:59:58 - INFO - __main__ - Step 5299: {'lr': 0.0004993876351518157, 'samples': 1017408, 'steps': 5298, 'loss/train': 1.865243911743164} +11/06/2021 21:59:59 - INFO - __main__ - Step 5300: {'lr': 0.0004993872638920335, 'samples': 1017600, 'steps': 5299, 'loss/train': 1.881446123123169} +11/06/2021 22:00:00 - INFO - __main__ - Step 5301: {'lr': 0.0004993868925198811, 'samples': 1017792, 'steps': 5300, 'loss/train': 2.0153396129608154} +11/06/2021 22:00:00 - INFO - __main__ - Step 5302: {'lr': 0.0004993865210353588, 'samples': 1017984, 'steps': 5301, 'loss/train': 1.8959330320358276} +11/06/2021 22:00:00 - INFO - __main__ - Step 5303: {'lr': 0.0004993861494384669, 'samples': 1018176, 'steps': 5302, 'loss/train': 1.8540432453155518} +11/06/2021 22:00:01 - INFO - __main__ - Step 5304: {'lr': 0.0004993857777292053, 'samples': 1018368, 'steps': 5303, 'loss/train': 1.6123359203338623} +11/06/2021 22:00:02 - INFO - __main__ - Step 5305: {'lr': 0.0004993854059075745, 'samples': 1018560, 'steps': 5304, 'loss/train': 2.1076877117156982} +11/06/2021 22:00:02 - INFO - __main__ - Step 5306: {'lr': 0.0004993850339735744, 'samples': 1018752, 'steps': 5305, 'loss/train': 1.8283599615097046} +11/06/2021 22:00:02 - INFO - __main__ - Step 5307: {'lr': 0.0004993846619272052, 'samples': 1018944, 'steps': 5306, 'loss/train': 2.057713508605957} +11/06/2021 22:00:03 - INFO - __main__ - Step 5308: {'lr': 0.0004993842897684672, 'samples': 1019136, 'steps': 5307, 'loss/train': 1.3499886989593506} +11/06/2021 22:00:03 - INFO - __main__ - Step 5309: {'lr': 0.0004993839174973604, 'samples': 1019328, 'steps': 5308, 'loss/train': 1.8223806619644165} +11/06/2021 22:00:04 - INFO - __main__ - Step 5310: {'lr': 0.0004993835451138851, 'samples': 1019520, 'steps': 5309, 'loss/train': 1.0041699409484863} +11/06/2021 22:00:04 - INFO - __main__ - Step 5311: {'lr': 0.0004993831726180414, 'samples': 1019712, 'steps': 5310, 'loss/train': 0.6815013289451599} +11/06/2021 22:00:05 - INFO - __main__ - Step 5312: {'lr': 0.0004993828000098296, 'samples': 1019904, 'steps': 5311, 'loss/train': 1.6194506883621216} +11/06/2021 22:00:05 - INFO - __main__ - Step 5313: {'lr': 0.0004993824272892497, 'samples': 1020096, 'steps': 5312, 'loss/train': 1.8829015493392944} +11/06/2021 22:00:05 - INFO - __main__ - Step 5314: {'lr': 0.0004993820544563018, 'samples': 1020288, 'steps': 5313, 'loss/train': 2.2411489486694336} +11/06/2021 22:00:06 - INFO - __main__ - Step 5315: {'lr': 0.0004993816815109863, 'samples': 1020480, 'steps': 5314, 'loss/train': 1.758228063583374} +11/06/2021 22:00:07 - INFO - __main__ - Step 5316: {'lr': 0.0004993813084533033, 'samples': 1020672, 'steps': 5315, 'loss/train': 1.9328948259353638} +11/06/2021 22:00:07 - INFO - __main__ - Step 5317: {'lr': 0.0004993809352832529, 'samples': 1020864, 'steps': 5316, 'loss/train': 1.9451228380203247} +11/06/2021 22:00:08 - INFO - __main__ - Step 5318: {'lr': 0.0004993805620008353, 'samples': 1021056, 'steps': 5317, 'loss/train': 2.118875026702881} +11/06/2021 22:00:08 - INFO - __main__ - Step 5319: {'lr': 0.0004993801886060506, 'samples': 1021248, 'steps': 5318, 'loss/train': 2.0214946269989014} +11/06/2021 22:00:09 - INFO - __main__ - Step 5320: {'lr': 0.0004993798150988991, 'samples': 1021440, 'steps': 5319, 'loss/train': 2.4562036991119385} +11/06/2021 22:00:09 - INFO - __main__ - Step 5321: {'lr': 0.0004993794414793808, 'samples': 1021632, 'steps': 5320, 'loss/train': 1.9569580554962158} +11/06/2021 22:00:10 - INFO - __main__ - Step 5322: {'lr': 0.0004993790677474962, 'samples': 1021824, 'steps': 5321, 'loss/train': 1.3694133758544922} +11/06/2021 22:00:10 - INFO - __main__ - Step 5323: {'lr': 0.0004993786939032451, 'samples': 1022016, 'steps': 5322, 'loss/train': 1.7816057205200195} +11/06/2021 22:00:10 - INFO - __main__ - Step 5324: {'lr': 0.0004993783199466278, 'samples': 1022208, 'steps': 5323, 'loss/train': 2.492426633834839} +11/06/2021 22:00:11 - INFO - __main__ - Step 5325: {'lr': 0.0004993779458776444, 'samples': 1022400, 'steps': 5324, 'loss/train': 2.574648857116699} +11/06/2021 22:00:12 - INFO - __main__ - Step 5326: {'lr': 0.0004993775716962953, 'samples': 1022592, 'steps': 5325, 'loss/train': 1.6549577713012695} +11/06/2021 22:00:12 - INFO - __main__ - Step 5327: {'lr': 0.0004993771974025805, 'samples': 1022784, 'steps': 5326, 'loss/train': 1.884212851524353} +11/06/2021 22:00:12 - INFO - __main__ - Step 5328: {'lr': 0.0004993768229965001, 'samples': 1022976, 'steps': 5327, 'loss/train': 2.4046313762664795} +11/06/2021 22:00:13 - INFO - __main__ - Step 5329: {'lr': 0.0004993764484780543, 'samples': 1023168, 'steps': 5328, 'loss/train': 1.4917925596237183} +11/06/2021 22:00:13 - INFO - __main__ - Step 5330: {'lr': 0.0004993760738472435, 'samples': 1023360, 'steps': 5329, 'loss/train': 1.8615087270736694} +11/06/2021 22:00:14 - INFO - __main__ - Step 5331: {'lr': 0.0004993756991040675, 'samples': 1023552, 'steps': 5330, 'loss/train': 1.8130137920379639} +11/06/2021 22:00:14 - INFO - __main__ - Step 5332: {'lr': 0.0004993753242485268, 'samples': 1023744, 'steps': 5331, 'loss/train': 2.364469051361084} +11/06/2021 22:00:15 - INFO - __main__ - Step 5333: {'lr': 0.0004993749492806214, 'samples': 1023936, 'steps': 5332, 'loss/train': 2.498106002807617} +11/06/2021 22:00:15 - INFO - __main__ - Step 5334: {'lr': 0.0004993745742003515, 'samples': 1024128, 'steps': 5333, 'loss/train': 1.809753656387329} +11/06/2021 22:00:16 - INFO - __main__ - Step 5335: {'lr': 0.0004993741990077172, 'samples': 1024320, 'steps': 5334, 'loss/train': 2.3342111110687256} +11/06/2021 22:00:16 - INFO - __main__ - Step 5336: {'lr': 0.0004993738237027188, 'samples': 1024512, 'steps': 5335, 'loss/train': 2.1999897956848145} +11/06/2021 22:00:17 - INFO - __main__ - Step 5337: {'lr': 0.0004993734482853563, 'samples': 1024704, 'steps': 5336, 'loss/train': 2.134817123413086} +11/06/2021 22:00:17 - INFO - __main__ - Step 5338: {'lr': 0.0004993730727556301, 'samples': 1024896, 'steps': 5337, 'loss/train': 1.9797841310501099} +11/06/2021 22:00:17 - INFO - __main__ - Step 5339: {'lr': 0.0004993726971135402, 'samples': 1025088, 'steps': 5338, 'loss/train': 1.4383511543273926} +11/06/2021 22:00:18 - INFO - __main__ - Step 5340: {'lr': 0.0004993723213590868, 'samples': 1025280, 'steps': 5339, 'loss/train': 2.2036027908325195} +11/06/2021 22:00:19 - INFO - __main__ - Step 5341: {'lr': 0.0004993719454922701, 'samples': 1025472, 'steps': 5340, 'loss/train': 2.0086007118225098} +11/06/2021 22:00:19 - INFO - __main__ - Step 5342: {'lr': 0.0004993715695130902, 'samples': 1025664, 'steps': 5341, 'loss/train': 1.6373944282531738} +11/06/2021 22:00:20 - INFO - __main__ - Step 5343: {'lr': 0.0004993711934215473, 'samples': 1025856, 'steps': 5342, 'loss/train': 1.591683268547058} +11/06/2021 22:00:20 - INFO - __main__ - Step 5344: {'lr': 0.0004993708172176417, 'samples': 1026048, 'steps': 5343, 'loss/train': 1.9710315465927124} +11/06/2021 22:00:20 - INFO - __main__ - Step 5345: {'lr': 0.0004993704409013734, 'samples': 1026240, 'steps': 5344, 'loss/train': 2.084678888320923} +11/06/2021 22:00:21 - INFO - __main__ - Step 5346: {'lr': 0.0004993700644727425, 'samples': 1026432, 'steps': 5345, 'loss/train': 2.1554689407348633} +11/06/2021 22:00:22 - INFO - __main__ - Step 5347: {'lr': 0.0004993696879317495, 'samples': 1026624, 'steps': 5346, 'loss/train': 1.5472863912582397} +11/06/2021 22:00:22 - INFO - __main__ - Step 5348: {'lr': 0.0004993693112783943, 'samples': 1026816, 'steps': 5347, 'loss/train': 1.995734691619873} +11/06/2021 22:00:22 - INFO - __main__ - Step 5349: {'lr': 0.0004993689345126771, 'samples': 1027008, 'steps': 5348, 'loss/train': 2.151108503341675} +11/06/2021 22:00:23 - INFO - __main__ - Step 5350: {'lr': 0.0004993685576345981, 'samples': 1027200, 'steps': 5349, 'loss/train': 2.3165838718414307} +11/06/2021 22:00:24 - INFO - __main__ - Step 5351: {'lr': 0.0004993681806441575, 'samples': 1027392, 'steps': 5350, 'loss/train': 2.325005292892456} +11/06/2021 22:00:24 - INFO - __main__ - Step 5352: {'lr': 0.0004993678035413554, 'samples': 1027584, 'steps': 5351, 'loss/train': 1.954711675643921} +11/06/2021 22:00:24 - INFO - __main__ - Step 5353: {'lr': 0.0004993674263261921, 'samples': 1027776, 'steps': 5352, 'loss/train': 1.639163851737976} +11/06/2021 22:00:25 - INFO - __main__ - Step 5354: {'lr': 0.0004993670489986677, 'samples': 1027968, 'steps': 5353, 'loss/train': 2.0933964252471924} +11/06/2021 22:00:25 - INFO - __main__ - Step 5355: {'lr': 0.0004993666715587823, 'samples': 1028160, 'steps': 5354, 'loss/train': 2.3471012115478516} +11/06/2021 22:00:26 - INFO - __main__ - Step 5356: {'lr': 0.0004993662940065361, 'samples': 1028352, 'steps': 5355, 'loss/train': 1.8415415287017822} +11/06/2021 22:00:26 - INFO - __main__ - Step 5357: {'lr': 0.0004993659163419294, 'samples': 1028544, 'steps': 5356, 'loss/train': 2.263580322265625} +11/06/2021 22:00:27 - INFO - __main__ - Step 5358: {'lr': 0.0004993655385649621, 'samples': 1028736, 'steps': 5357, 'loss/train': 1.8695333003997803} +11/06/2021 22:00:27 - INFO - __main__ - Step 5359: {'lr': 0.0004993651606756347, 'samples': 1028928, 'steps': 5358, 'loss/train': 2.1542937755584717} +11/06/2021 22:00:28 - INFO - __main__ - Step 5360: {'lr': 0.0004993647826739471, 'samples': 1029120, 'steps': 5359, 'loss/train': 1.7459410429000854} +11/06/2021 22:00:28 - INFO - __main__ - Step 5361: {'lr': 0.0004993644045598997, 'samples': 1029312, 'steps': 5360, 'loss/train': 2.4149515628814697} +11/06/2021 22:00:29 - INFO - __main__ - Step 5362: {'lr': 0.0004993640263334924, 'samples': 1029504, 'steps': 5361, 'loss/train': 1.8618431091308594} +11/06/2021 22:00:29 - INFO - __main__ - Step 5363: {'lr': 0.0004993636479947256, 'samples': 1029696, 'steps': 5362, 'loss/train': 1.1702266931533813} +11/06/2021 22:00:30 - INFO - __main__ - Step 5364: {'lr': 0.0004993632695435993, 'samples': 1029888, 'steps': 5363, 'loss/train': 2.124359369277954} +11/06/2021 22:00:30 - INFO - __main__ - Step 5365: {'lr': 0.0004993628909801138, 'samples': 1030080, 'steps': 5364, 'loss/train': 1.8695933818817139} +11/06/2021 22:00:31 - INFO - __main__ - Step 5366: {'lr': 0.0004993625123042694, 'samples': 1030272, 'steps': 5365, 'loss/train': 2.126741409301758} +11/06/2021 22:00:31 - INFO - __main__ - Step 5367: {'lr': 0.0004993621335160659, 'samples': 1030464, 'steps': 5366, 'loss/train': 2.1236331462860107} +11/06/2021 22:00:32 - INFO - __main__ - Step 5368: {'lr': 0.0004993617546155037, 'samples': 1030656, 'steps': 5367, 'loss/train': 1.1388921737670898} +11/06/2021 22:00:32 - INFO - __main__ - Step 5369: {'lr': 0.000499361375602583, 'samples': 1030848, 'steps': 5368, 'loss/train': 2.0226683616638184} +11/06/2021 22:00:32 - INFO - __main__ - Step 5370: {'lr': 0.0004993609964773039, 'samples': 1031040, 'steps': 5369, 'loss/train': 1.933193325996399} +11/06/2021 22:00:33 - INFO - __main__ - Step 5371: {'lr': 0.0004993606172396665, 'samples': 1031232, 'steps': 5370, 'loss/train': 1.9464812278747559} +11/06/2021 22:00:34 - INFO - __main__ - Step 5372: {'lr': 0.0004993602378896712, 'samples': 1031424, 'steps': 5371, 'loss/train': 1.1575310230255127} +11/06/2021 22:00:34 - INFO - __main__ - Step 5373: {'lr': 0.0004993598584273179, 'samples': 1031616, 'steps': 5372, 'loss/train': 2.0827817916870117} +11/06/2021 22:00:34 - INFO - __main__ - Step 5374: {'lr': 0.0004993594788526069, 'samples': 1031808, 'steps': 5373, 'loss/train': 2.1130635738372803} +11/06/2021 22:00:35 - INFO - __main__ - Step 5375: {'lr': 0.0004993590991655384, 'samples': 1032000, 'steps': 5374, 'loss/train': 2.0169715881347656} +11/06/2021 22:00:35 - INFO - __main__ - Step 5376: {'lr': 0.0004993587193661126, 'samples': 1032192, 'steps': 5375, 'loss/train': 2.4737699031829834} +11/06/2021 22:00:36 - INFO - __main__ - Step 5377: {'lr': 0.0004993583394543295, 'samples': 1032384, 'steps': 5376, 'loss/train': 1.8116259574890137} +11/06/2021 22:00:37 - INFO - __main__ - Step 5378: {'lr': 0.0004993579594301895, 'samples': 1032576, 'steps': 5377, 'loss/train': 1.8319172859191895} +11/06/2021 22:00:37 - INFO - __main__ - Step 5379: {'lr': 0.0004993575792936925, 'samples': 1032768, 'steps': 5378, 'loss/train': 1.6784554719924927} +11/06/2021 22:00:37 - INFO - __main__ - Step 5380: {'lr': 0.000499357199044839, 'samples': 1032960, 'steps': 5379, 'loss/train': 1.458201289176941} +11/06/2021 22:00:38 - INFO - __main__ - Step 5381: {'lr': 0.0004993568186836288, 'samples': 1033152, 'steps': 5380, 'loss/train': 1.8276842832565308} +11/06/2021 22:00:39 - INFO - __main__ - Step 5382: {'lr': 0.0004993564382100624, 'samples': 1033344, 'steps': 5381, 'loss/train': 1.3644241094589233} +11/06/2021 22:00:39 - INFO - __main__ - Step 5383: {'lr': 0.0004993560576241398, 'samples': 1033536, 'steps': 5382, 'loss/train': 1.386871337890625} +11/06/2021 22:00:39 - INFO - __main__ - Step 5384: {'lr': 0.0004993556769258612, 'samples': 1033728, 'steps': 5383, 'loss/train': 1.235226035118103} +11/06/2021 22:00:40 - INFO - __main__ - Step 5385: {'lr': 0.0004993552961152268, 'samples': 1033920, 'steps': 5384, 'loss/train': 1.334904670715332} +11/06/2021 22:00:40 - INFO - __main__ - Step 5386: {'lr': 0.0004993549151922367, 'samples': 1034112, 'steps': 5385, 'loss/train': 2.5312018394470215} +11/06/2021 22:00:41 - INFO - __main__ - Step 5387: {'lr': 0.0004993545341568912, 'samples': 1034304, 'steps': 5386, 'loss/train': 1.546046257019043} +11/06/2021 22:00:41 - INFO - __main__ - Step 5388: {'lr': 0.0004993541530091903, 'samples': 1034496, 'steps': 5387, 'loss/train': 1.8282663822174072} +11/06/2021 22:00:42 - INFO - __main__ - Step 5389: {'lr': 0.0004993537717491343, 'samples': 1034688, 'steps': 5388, 'loss/train': 2.0151655673980713} +11/06/2021 22:00:42 - INFO - __main__ - Step 5390: {'lr': 0.0004993533903767235, 'samples': 1034880, 'steps': 5389, 'loss/train': 1.5707823038101196} +11/06/2021 22:00:42 - INFO - __main__ - Step 5391: {'lr': 0.0004993530088919577, 'samples': 1035072, 'steps': 5390, 'loss/train': 1.7136812210083008} +11/06/2021 22:00:43 - INFO - __main__ - Step 5392: {'lr': 0.0004993526272948374, 'samples': 1035264, 'steps': 5391, 'loss/train': 0.6717694401741028} +11/06/2021 22:00:44 - INFO - __main__ - Step 5393: {'lr': 0.0004993522455853626, 'samples': 1035456, 'steps': 5392, 'loss/train': 1.5146379470825195} +11/06/2021 22:00:44 - INFO - __main__ - Step 5394: {'lr': 0.0004993518637635334, 'samples': 1035648, 'steps': 5393, 'loss/train': 1.4863612651824951} +11/06/2021 22:00:45 - INFO - __main__ - Step 5395: {'lr': 0.0004993514818293503, 'samples': 1035840, 'steps': 5394, 'loss/train': 1.7902588844299316} +11/06/2021 22:00:45 - INFO - __main__ - Step 5396: {'lr': 0.0004993510997828132, 'samples': 1036032, 'steps': 5395, 'loss/train': 1.7345638275146484} +11/06/2021 22:00:45 - INFO - __main__ - Step 5397: {'lr': 0.0004993507176239224, 'samples': 1036224, 'steps': 5396, 'loss/train': 1.4879080057144165} +11/06/2021 22:00:46 - INFO - __main__ - Step 5398: {'lr': 0.0004993503353526779, 'samples': 1036416, 'steps': 5397, 'loss/train': 1.566808819770813} +11/06/2021 22:00:47 - INFO - __main__ - Step 5399: {'lr': 0.0004993499529690801, 'samples': 1036608, 'steps': 5398, 'loss/train': 1.6237696409225464} +11/06/2021 22:00:47 - INFO - __main__ - Step 5400: {'lr': 0.000499349570473129, 'samples': 1036800, 'steps': 5399, 'loss/train': 2.0763614177703857} +11/06/2021 22:00:47 - INFO - __main__ - Step 5401: {'lr': 0.0004993491878648249, 'samples': 1036992, 'steps': 5400, 'loss/train': 2.139653444290161} +11/06/2021 22:00:48 - INFO - __main__ - Step 5402: {'lr': 0.0004993488051441677, 'samples': 1037184, 'steps': 5401, 'loss/train': 1.2702760696411133} +11/06/2021 22:00:49 - INFO - __main__ - Step 5403: {'lr': 0.000499348422311158, 'samples': 1037376, 'steps': 5402, 'loss/train': 1.7422914505004883} +11/06/2021 22:00:49 - INFO - __main__ - Step 5404: {'lr': 0.0004993480393657956, 'samples': 1037568, 'steps': 5403, 'loss/train': 1.667367935180664} +11/06/2021 22:00:50 - INFO - __main__ - Step 5405: {'lr': 0.0004993476563080809, 'samples': 1037760, 'steps': 5404, 'loss/train': 1.849706768989563} +11/06/2021 22:00:50 - INFO - __main__ - Step 5406: {'lr': 0.000499347273138014, 'samples': 1037952, 'steps': 5405, 'loss/train': 1.485642433166504} +11/06/2021 22:00:50 - INFO - __main__ - Step 5407: {'lr': 0.000499346889855595, 'samples': 1038144, 'steps': 5406, 'loss/train': 1.8878998756408691} +11/06/2021 22:00:51 - INFO - __main__ - Step 5408: {'lr': 0.0004993465064608242, 'samples': 1038336, 'steps': 5407, 'loss/train': 2.2448551654815674} +11/06/2021 22:00:52 - INFO - __main__ - Step 5409: {'lr': 0.0004993461229537017, 'samples': 1038528, 'steps': 5408, 'loss/train': 1.8952325582504272} +11/06/2021 22:00:52 - INFO - __main__ - Step 5410: {'lr': 0.0004993457393342276, 'samples': 1038720, 'steps': 5409, 'loss/train': 1.7118123769760132} +11/06/2021 22:00:52 - INFO - __main__ - Step 5411: {'lr': 0.0004993453556024023, 'samples': 1038912, 'steps': 5410, 'loss/train': 1.6171423196792603} +11/06/2021 22:00:53 - INFO - __main__ - Step 5412: {'lr': 0.0004993449717582258, 'samples': 1039104, 'steps': 5411, 'loss/train': 1.8556959629058838} +11/06/2021 22:00:53 - INFO - __main__ - Step 5413: {'lr': 0.0004993445878016982, 'samples': 1039296, 'steps': 5412, 'loss/train': 2.079441547393799} +11/06/2021 22:00:54 - INFO - __main__ - Step 5414: {'lr': 0.0004993442037328199, 'samples': 1039488, 'steps': 5413, 'loss/train': 2.005168914794922} +11/06/2021 22:00:54 - INFO - __main__ - Step 5415: {'lr': 0.0004993438195515909, 'samples': 1039680, 'steps': 5414, 'loss/train': 1.7402551174163818} +11/06/2021 22:00:55 - INFO - __main__ - Step 5416: {'lr': 0.0004993434352580115, 'samples': 1039872, 'steps': 5415, 'loss/train': 1.5889499187469482} +11/06/2021 22:00:55 - INFO - __main__ - Step 5417: {'lr': 0.0004993430508520816, 'samples': 1040064, 'steps': 5416, 'loss/train': 2.1305549144744873} +11/06/2021 22:00:55 - INFO - __main__ - Step 5418: {'lr': 0.0004993426663338018, 'samples': 1040256, 'steps': 5417, 'loss/train': 1.9073415994644165} +11/06/2021 22:00:57 - INFO - __main__ - Step 5419: {'lr': 0.0004993422817031719, 'samples': 1040448, 'steps': 5418, 'loss/train': 2.1884820461273193} +11/06/2021 22:00:57 - INFO - __main__ - Step 5420: {'lr': 0.0004993418969601921, 'samples': 1040640, 'steps': 5419, 'loss/train': 2.154372215270996} +11/06/2021 22:00:57 - INFO - __main__ - Step 5421: {'lr': 0.0004993415121048629, 'samples': 1040832, 'steps': 5420, 'loss/train': 1.9942115545272827} +11/06/2021 22:00:58 - INFO - __main__ - Step 5422: {'lr': 0.0004993411271371842, 'samples': 1041024, 'steps': 5421, 'loss/train': 1.9106769561767578} +11/06/2021 22:00:58 - INFO - __main__ - Step 5423: {'lr': 0.0004993407420571563, 'samples': 1041216, 'steps': 5422, 'loss/train': 1.0730233192443848} +11/06/2021 22:00:59 - INFO - __main__ - Step 5424: {'lr': 0.0004993403568647792, 'samples': 1041408, 'steps': 5423, 'loss/train': 2.985499143600464} +11/06/2021 22:01:00 - INFO - __main__ - Step 5425: {'lr': 0.0004993399715600531, 'samples': 1041600, 'steps': 5424, 'loss/train': 1.9801826477050781} +11/06/2021 22:01:00 - INFO - __main__ - Step 5426: {'lr': 0.0004993395861429785, 'samples': 1041792, 'steps': 5425, 'loss/train': 2.2979655265808105} +11/06/2021 22:01:00 - INFO - __main__ - Step 5427: {'lr': 0.0004993392006135552, 'samples': 1041984, 'steps': 5426, 'loss/train': 1.975477933883667} +11/06/2021 22:01:01 - INFO - __main__ - Step 5428: {'lr': 0.0004993388149717834, 'samples': 1042176, 'steps': 5427, 'loss/train': 1.659934639930725} +11/06/2021 22:01:02 - INFO - __main__ - Step 5429: {'lr': 0.0004993384292176636, 'samples': 1042368, 'steps': 5428, 'loss/train': 0.41693881154060364} +11/06/2021 22:01:02 - INFO - __main__ - Step 5430: {'lr': 0.0004993380433511956, 'samples': 1042560, 'steps': 5429, 'loss/train': 1.881492257118225} +11/06/2021 22:01:03 - INFO - __main__ - Step 5431: {'lr': 0.0004993376573723798, 'samples': 1042752, 'steps': 5430, 'loss/train': 2.2154150009155273} +11/06/2021 22:01:03 - INFO - __main__ - Step 5432: {'lr': 0.0004993372712812162, 'samples': 1042944, 'steps': 5431, 'loss/train': 2.0306501388549805} +11/06/2021 22:01:04 - INFO - __main__ - Step 5433: {'lr': 0.0004993368850777052, 'samples': 1043136, 'steps': 5432, 'loss/train': 2.2101669311523438} +11/06/2021 22:01:04 - INFO - __main__ - Step 5434: {'lr': 0.0004993364987618468, 'samples': 1043328, 'steps': 5433, 'loss/train': 2.0793869495391846} +11/06/2021 22:01:05 - INFO - __main__ - Step 5435: {'lr': 0.0004993361123336412, 'samples': 1043520, 'steps': 5434, 'loss/train': 1.7962534427642822} +11/06/2021 22:01:05 - INFO - __main__ - Step 5436: {'lr': 0.0004993357257930887, 'samples': 1043712, 'steps': 5435, 'loss/train': 2.5018160343170166} +11/06/2021 22:01:06 - INFO - __main__ - Step 5437: {'lr': 0.0004993353391401892, 'samples': 1043904, 'steps': 5436, 'loss/train': 2.258634567260742} +11/06/2021 22:01:06 - INFO - __main__ - Step 5438: {'lr': 0.0004993349523749431, 'samples': 1044096, 'steps': 5437, 'loss/train': 1.8289518356323242} +11/06/2021 22:01:07 - INFO - __main__ - Step 5439: {'lr': 0.0004993345654973505, 'samples': 1044288, 'steps': 5438, 'loss/train': 1.9161920547485352} +11/06/2021 22:01:07 - INFO - __main__ - Step 5440: {'lr': 0.0004993341785074116, 'samples': 1044480, 'steps': 5439, 'loss/train': 2.753596305847168} +11/06/2021 22:01:07 - INFO - __main__ - Step 5441: {'lr': 0.0004993337914051266, 'samples': 1044672, 'steps': 5440, 'loss/train': 1.9837926626205444} +11/06/2021 22:01:08 - INFO - __main__ - Step 5442: {'lr': 0.0004993334041904957, 'samples': 1044864, 'steps': 5441, 'loss/train': 0.3798553943634033} +11/06/2021 22:01:09 - INFO - __main__ - Step 5443: {'lr': 0.0004993330168635189, 'samples': 1045056, 'steps': 5442, 'loss/train': 1.5008134841918945} +11/06/2021 22:01:09 - INFO - __main__ - Step 5444: {'lr': 0.0004993326294241966, 'samples': 1045248, 'steps': 5443, 'loss/train': 0.524370014667511} +11/06/2021 22:01:09 - INFO - __main__ - Step 5445: {'lr': 0.0004993322418725286, 'samples': 1045440, 'steps': 5444, 'loss/train': 1.8944960832595825} +11/06/2021 22:01:10 - INFO - __main__ - Step 5446: {'lr': 0.0004993318542085157, 'samples': 1045632, 'steps': 5445, 'loss/train': 2.161842107772827} +11/06/2021 22:01:11 - INFO - __main__ - Step 5447: {'lr': 0.0004993314664321575, 'samples': 1045824, 'steps': 5446, 'loss/train': 2.0262186527252197} +11/06/2021 22:01:11 - INFO - __main__ - Step 5448: {'lr': 0.0004993310785434544, 'samples': 1046016, 'steps': 5447, 'loss/train': 1.3276009559631348} +11/06/2021 22:01:11 - INFO - __main__ - Step 5449: {'lr': 0.0004993306905424067, 'samples': 1046208, 'steps': 5448, 'loss/train': 1.6204453706741333} +11/06/2021 22:01:12 - INFO - __main__ - Step 5450: {'lr': 0.0004993303024290143, 'samples': 1046400, 'steps': 5449, 'loss/train': 2.0517914295196533} +11/06/2021 22:01:12 - INFO - __main__ - Step 5451: {'lr': 0.0004993299142032776, 'samples': 1046592, 'steps': 5450, 'loss/train': 1.5047802925109863} +11/06/2021 22:01:13 - INFO - __main__ - Step 5452: {'lr': 0.0004993295258651966, 'samples': 1046784, 'steps': 5451, 'loss/train': 2.418118953704834} +11/06/2021 22:01:14 - INFO - __main__ - Step 5453: {'lr': 0.0004993291374147716, 'samples': 1046976, 'steps': 5452, 'loss/train': 0.4726817011833191} +11/06/2021 22:01:14 - INFO - __main__ - Step 5454: {'lr': 0.0004993287488520027, 'samples': 1047168, 'steps': 5453, 'loss/train': 2.1030688285827637} +11/06/2021 22:01:14 - INFO - __main__ - Step 5455: {'lr': 0.0004993283601768902, 'samples': 1047360, 'steps': 5454, 'loss/train': 2.6343281269073486} +11/06/2021 22:01:15 - INFO - __main__ - Step 5456: {'lr': 0.0004993279713894342, 'samples': 1047552, 'steps': 5455, 'loss/train': 2.150969982147217} +11/06/2021 22:01:16 - INFO - __main__ - Step 5457: {'lr': 0.0004993275824896348, 'samples': 1047744, 'steps': 5456, 'loss/train': 1.408422827720642} +11/06/2021 22:01:16 - INFO - __main__ - Step 5458: {'lr': 0.0004993271934774922, 'samples': 1047936, 'steps': 5457, 'loss/train': 1.94776451587677} +11/06/2021 22:01:16 - INFO - __main__ - Step 5459: {'lr': 0.0004993268043530067, 'samples': 1048128, 'steps': 5458, 'loss/train': 1.2634351253509521} +11/06/2021 22:01:17 - INFO - __main__ - Step 5460: {'lr': 0.0004993264151161783, 'samples': 1048320, 'steps': 5459, 'loss/train': 1.6682987213134766} +11/06/2021 22:01:17 - INFO - __main__ - Step 5461: {'lr': 0.0004993260257670074, 'samples': 1048512, 'steps': 5460, 'loss/train': 2.2864060401916504} +11/06/2021 22:01:18 - INFO - __main__ - Step 5462: {'lr': 0.000499325636305494, 'samples': 1048704, 'steps': 5461, 'loss/train': 1.3038978576660156} +11/06/2021 22:01:18 - INFO - __main__ - Step 5463: {'lr': 0.0004993252467316382, 'samples': 1048896, 'steps': 5462, 'loss/train': 1.608263373374939} +11/06/2021 22:01:19 - INFO - __main__ - Step 5464: {'lr': 0.0004993248570454404, 'samples': 1049088, 'steps': 5463, 'loss/train': 1.6738258600234985} +11/06/2021 22:01:19 - INFO - __main__ - Step 5465: {'lr': 0.0004993244672469007, 'samples': 1049280, 'steps': 5464, 'loss/train': 2.2814807891845703} +11/06/2021 22:01:19 - INFO - __main__ - Step 5466: {'lr': 0.000499324077336019, 'samples': 1049472, 'steps': 5465, 'loss/train': 1.8330951929092407} +11/06/2021 22:01:20 - INFO - __main__ - Step 5467: {'lr': 0.000499323687312796, 'samples': 1049664, 'steps': 5466, 'loss/train': 1.905300498008728} +11/06/2021 22:01:21 - INFO - __main__ - Step 5468: {'lr': 0.0004993232971772315, 'samples': 1049856, 'steps': 5467, 'loss/train': 1.9987244606018066} +11/06/2021 22:01:21 - INFO - __main__ - Step 5469: {'lr': 0.0004993229069293257, 'samples': 1050048, 'steps': 5468, 'loss/train': 2.0383851528167725} +11/06/2021 22:01:21 - INFO - __main__ - Step 5470: {'lr': 0.0004993225165690789, 'samples': 1050240, 'steps': 5469, 'loss/train': 1.96856689453125} +11/06/2021 22:01:22 - INFO - __main__ - Step 5471: {'lr': 0.0004993221260964912, 'samples': 1050432, 'steps': 5470, 'loss/train': 2.155994415283203} +11/06/2021 22:01:22 - INFO - __main__ - Step 5472: {'lr': 0.0004993217355115628, 'samples': 1050624, 'steps': 5471, 'loss/train': 2.175236463546753} +11/06/2021 22:01:23 - INFO - __main__ - Step 5473: {'lr': 0.0004993213448142939, 'samples': 1050816, 'steps': 5472, 'loss/train': 2.2860300540924072} +11/06/2021 22:01:24 - INFO - __main__ - Step 5474: {'lr': 0.0004993209540046846, 'samples': 1051008, 'steps': 5473, 'loss/train': 2.309166431427002} +11/06/2021 22:01:24 - INFO - __main__ - Step 5475: {'lr': 0.0004993205630827352, 'samples': 1051200, 'steps': 5474, 'loss/train': 1.8463259935379028} +11/06/2021 22:01:24 - INFO - __main__ - Step 5476: {'lr': 0.0004993201720484458, 'samples': 1051392, 'steps': 5475, 'loss/train': 1.8536326885223389} +11/06/2021 22:01:25 - INFO - __main__ - Step 5477: {'lr': 0.0004993197809018165, 'samples': 1051584, 'steps': 5476, 'loss/train': 1.8011512756347656} +11/06/2021 22:01:26 - INFO - __main__ - Step 5478: {'lr': 0.0004993193896428476, 'samples': 1051776, 'steps': 5477, 'loss/train': 1.370781421661377} +11/06/2021 22:01:26 - INFO - __main__ - Step 5479: {'lr': 0.0004993189982715392, 'samples': 1051968, 'steps': 5478, 'loss/train': 1.9263511896133423} +11/06/2021 22:01:26 - INFO - __main__ - Step 5480: {'lr': 0.0004993186067878916, 'samples': 1052160, 'steps': 5479, 'loss/train': 1.3620198965072632} +11/06/2021 22:01:27 - INFO - __main__ - Step 5481: {'lr': 0.0004993182151919049, 'samples': 1052352, 'steps': 5480, 'loss/train': 2.0209407806396484} +11/06/2021 22:01:27 - INFO - __main__ - Step 5482: {'lr': 0.0004993178234835792, 'samples': 1052544, 'steps': 5481, 'loss/train': 1.6855971813201904} +11/06/2021 22:01:28 - INFO - __main__ - Step 5483: {'lr': 0.0004993174316629146, 'samples': 1052736, 'steps': 5482, 'loss/train': 2.446448802947998} +11/06/2021 22:01:28 - INFO - __main__ - Step 5484: {'lr': 0.0004993170397299116, 'samples': 1052928, 'steps': 5483, 'loss/train': 1.8740376234054565} +11/06/2021 22:01:29 - INFO - __main__ - Step 5485: {'lr': 0.0004993166476845701, 'samples': 1053120, 'steps': 5484, 'loss/train': 2.2243385314941406} +11/06/2021 22:01:29 - INFO - __main__ - Step 5486: {'lr': 0.0004993162555268903, 'samples': 1053312, 'steps': 5485, 'loss/train': 1.9227041006088257} +11/06/2021 22:01:29 - INFO - __main__ - Step 5487: {'lr': 0.0004993158632568726, 'samples': 1053504, 'steps': 5486, 'loss/train': 2.1195530891418457} +11/06/2021 22:01:30 - INFO - __main__ - Step 5488: {'lr': 0.000499315470874517, 'samples': 1053696, 'steps': 5487, 'loss/train': 2.2419090270996094} +11/06/2021 22:01:31 - INFO - __main__ - Step 5489: {'lr': 0.0004993150783798236, 'samples': 1053888, 'steps': 5488, 'loss/train': 2.4271090030670166} +11/06/2021 22:01:31 - INFO - __main__ - Step 5490: {'lr': 0.0004993146857727927, 'samples': 1054080, 'steps': 5489, 'loss/train': 1.7117938995361328} +11/06/2021 22:01:31 - INFO - __main__ - Step 5491: {'lr': 0.0004993142930534245, 'samples': 1054272, 'steps': 5490, 'loss/train': 1.232141375541687} +11/06/2021 22:01:32 - INFO - __main__ - Step 5492: {'lr': 0.000499313900221719, 'samples': 1054464, 'steps': 5491, 'loss/train': 1.8107589483261108} +11/06/2021 22:01:33 - INFO - __main__ - Step 5493: {'lr': 0.0004993135072776766, 'samples': 1054656, 'steps': 5492, 'loss/train': 2.035764694213867} +11/06/2021 22:01:33 - INFO - __main__ - Step 5494: {'lr': 0.0004993131142212974, 'samples': 1054848, 'steps': 5493, 'loss/train': 1.9107087850570679} +11/06/2021 22:01:33 - INFO - __main__ - Step 5495: {'lr': 0.0004993127210525815, 'samples': 1055040, 'steps': 5494, 'loss/train': 1.5598526000976562} +11/06/2021 22:01:34 - INFO - __main__ - Step 5496: {'lr': 0.0004993123277715292, 'samples': 1055232, 'steps': 5495, 'loss/train': 1.6145435571670532} +11/06/2021 22:01:34 - INFO - __main__ - Step 5497: {'lr': 0.0004993119343781406, 'samples': 1055424, 'steps': 5496, 'loss/train': 1.697355031967163} +11/06/2021 22:01:35 - INFO - __main__ - Step 5498: {'lr': 0.0004993115408724159, 'samples': 1055616, 'steps': 5497, 'loss/train': 1.3558404445648193} +11/06/2021 22:01:36 - INFO - __main__ - Step 5499: {'lr': 0.0004993111472543552, 'samples': 1055808, 'steps': 5498, 'loss/train': 1.6926814317703247} +11/06/2021 22:01:36 - INFO - __main__ - Step 5500: {'lr': 0.0004993107535239588, 'samples': 1056000, 'steps': 5499, 'loss/train': 1.3640247583389282} +11/06/2021 22:01:36 - INFO - __main__ - Step 5501: {'lr': 0.0004993103596812267, 'samples': 1056192, 'steps': 5500, 'loss/train': 1.8864690065383911} +11/06/2021 22:01:37 - INFO - __main__ - Step 5502: {'lr': 0.0004993099657261594, 'samples': 1056384, 'steps': 5501, 'loss/train': 2.0299696922302246} +11/06/2021 22:01:37 - INFO - __main__ - Step 5503: {'lr': 0.0004993095716587568, 'samples': 1056576, 'steps': 5502, 'loss/train': 2.2388596534729004} +11/06/2021 22:01:38 - INFO - __main__ - Step 5504: {'lr': 0.0004993091774790191, 'samples': 1056768, 'steps': 5503, 'loss/train': 1.5079683065414429} +11/06/2021 22:01:38 - INFO - __main__ - Step 5505: {'lr': 0.0004993087831869466, 'samples': 1056960, 'steps': 5504, 'loss/train': 2.0037267208099365} +11/06/2021 22:01:39 - INFO - __main__ - Step 5506: {'lr': 0.0004993083887825393, 'samples': 1057152, 'steps': 5505, 'loss/train': 2.18703556060791} +11/06/2021 22:01:39 - INFO - __main__ - Step 5507: {'lr': 0.0004993079942657976, 'samples': 1057344, 'steps': 5506, 'loss/train': 1.9802910089492798} +11/06/2021 22:01:39 - INFO - __main__ - Step 5508: {'lr': 0.0004993075996367215, 'samples': 1057536, 'steps': 5507, 'loss/train': 2.6383426189422607} +11/06/2021 22:01:40 - INFO - __main__ - Step 5509: {'lr': 0.0004993072048953113, 'samples': 1057728, 'steps': 5508, 'loss/train': 2.038627862930298} +11/06/2021 22:01:41 - INFO - __main__ - Step 5510: {'lr': 0.0004993068100415671, 'samples': 1057920, 'steps': 5509, 'loss/train': 1.877155065536499} +11/06/2021 22:01:41 - INFO - __main__ - Step 5511: {'lr': 0.000499306415075489, 'samples': 1058112, 'steps': 5510, 'loss/train': 1.7391774654388428} +11/06/2021 22:01:41 - INFO - __main__ - Step 5512: {'lr': 0.0004993060199970774, 'samples': 1058304, 'steps': 5511, 'loss/train': 2.053729772567749} +11/06/2021 22:01:42 - INFO - __main__ - Step 5513: {'lr': 0.0004993056248063323, 'samples': 1058496, 'steps': 5512, 'loss/train': 2.05024790763855} +11/06/2021 22:01:43 - INFO - __main__ - Step 5514: {'lr': 0.000499305229503254, 'samples': 1058688, 'steps': 5513, 'loss/train': 1.8646981716156006} +11/06/2021 22:01:43 - INFO - __main__ - Step 5515: {'lr': 0.0004993048340878425, 'samples': 1058880, 'steps': 5514, 'loss/train': 2.1601507663726807} +11/06/2021 22:01:44 - INFO - __main__ - Step 5516: {'lr': 0.0004993044385600982, 'samples': 1059072, 'steps': 5515, 'loss/train': 1.9711893796920776} +11/06/2021 22:01:44 - INFO - __main__ - Step 5517: {'lr': 0.0004993040429200211, 'samples': 1059264, 'steps': 5516, 'loss/train': 2.012702465057373} +11/06/2021 22:01:44 - INFO - __main__ - Step 5518: {'lr': 0.0004993036471676115, 'samples': 1059456, 'steps': 5517, 'loss/train': 1.4311362504959106} +11/06/2021 22:01:45 - INFO - __main__ - Step 5519: {'lr': 0.0004993032513028695, 'samples': 1059648, 'steps': 5518, 'loss/train': 1.7759687900543213} +11/06/2021 22:01:45 - INFO - __main__ - Step 5520: {'lr': 0.0004993028553257952, 'samples': 1059840, 'steps': 5519, 'loss/train': 2.569220781326294} +11/06/2021 22:01:46 - INFO - __main__ - Step 5521: {'lr': 0.000499302459236389, 'samples': 1060032, 'steps': 5520, 'loss/train': 1.6093146800994873} +11/06/2021 22:01:46 - INFO - __main__ - Step 5522: {'lr': 0.0004993020630346509, 'samples': 1060224, 'steps': 5521, 'loss/train': 2.444692611694336} +11/06/2021 22:01:47 - INFO - __main__ - Step 5523: {'lr': 0.0004993016667205812, 'samples': 1060416, 'steps': 5522, 'loss/train': 2.1542999744415283} +11/06/2021 22:01:48 - INFO - __main__ - Step 5524: {'lr': 0.0004993012702941799, 'samples': 1060608, 'steps': 5523, 'loss/train': 1.754870891571045} +11/06/2021 22:01:48 - INFO - __main__ - Step 5525: {'lr': 0.0004993008737554474, 'samples': 1060800, 'steps': 5524, 'loss/train': 1.7959246635437012} +11/06/2021 22:01:48 - INFO - __main__ - Step 5526: {'lr': 0.0004993004771043837, 'samples': 1060992, 'steps': 5525, 'loss/train': 2.041109800338745} +11/06/2021 22:01:49 - INFO - __main__ - Step 5527: {'lr': 0.0004993000803409891, 'samples': 1061184, 'steps': 5526, 'loss/train': 2.20894455909729} +11/06/2021 22:01:49 - INFO - __main__ - Step 5528: {'lr': 0.0004992996834652638, 'samples': 1061376, 'steps': 5527, 'loss/train': 1.942233681678772} +11/06/2021 22:01:50 - INFO - __main__ - Step 5529: {'lr': 0.0004992992864772079, 'samples': 1061568, 'steps': 5528, 'loss/train': 1.7475767135620117} +11/06/2021 22:01:50 - INFO - __main__ - Step 5530: {'lr': 0.0004992988893768214, 'samples': 1061760, 'steps': 5529, 'loss/train': 2.076091766357422} +11/06/2021 22:01:51 - INFO - __main__ - Step 5531: {'lr': 0.0004992984921641048, 'samples': 1061952, 'steps': 5530, 'loss/train': 2.0082509517669678} +11/06/2021 22:01:51 - INFO - __main__ - Step 5532: {'lr': 0.0004992980948390582, 'samples': 1062144, 'steps': 5531, 'loss/train': 1.9930384159088135} +11/06/2021 22:01:51 - INFO - __main__ - Step 5533: {'lr': 0.0004992976974016817, 'samples': 1062336, 'steps': 5532, 'loss/train': 2.128443479537964} +11/06/2021 22:01:52 - INFO - __main__ - Step 5534: {'lr': 0.0004992972998519755, 'samples': 1062528, 'steps': 5533, 'loss/train': 1.8396596908569336} +11/06/2021 22:01:53 - INFO - __main__ - Step 5535: {'lr': 0.0004992969021899397, 'samples': 1062720, 'steps': 5534, 'loss/train': 1.7834552526474} +11/06/2021 22:01:53 - INFO - __main__ - Step 5536: {'lr': 0.0004992965044155746, 'samples': 1062912, 'steps': 5535, 'loss/train': 1.7400227785110474} +11/06/2021 22:01:54 - INFO - __main__ - Step 5537: {'lr': 0.0004992961065288803, 'samples': 1063104, 'steps': 5536, 'loss/train': 1.9240829944610596} +11/06/2021 22:01:54 - INFO - __main__ - Step 5538: {'lr': 0.0004992957085298571, 'samples': 1063296, 'steps': 5537, 'loss/train': 1.3260631561279297} +11/06/2021 22:01:54 - INFO - __main__ - Step 5539: {'lr': 0.0004992953104185052, 'samples': 1063488, 'steps': 5538, 'loss/train': 1.4942200183868408} +11/06/2021 22:01:55 - INFO - __main__ - Step 5540: {'lr': 0.0004992949121948245, 'samples': 1063680, 'steps': 5539, 'loss/train': 1.48552668094635} +11/06/2021 22:01:56 - INFO - __main__ - Step 5541: {'lr': 0.0004992945138588154, 'samples': 1063872, 'steps': 5540, 'loss/train': 1.611240267753601} +11/06/2021 22:01:56 - INFO - __main__ - Step 5542: {'lr': 0.0004992941154104781, 'samples': 1064064, 'steps': 5541, 'loss/train': 1.437373399734497} +11/06/2021 22:01:56 - INFO - __main__ - Step 5543: {'lr': 0.0004992937168498126, 'samples': 1064256, 'steps': 5542, 'loss/train': 1.7761310338974} +11/06/2021 22:01:57 - INFO - __main__ - Step 5544: {'lr': 0.0004992933181768194, 'samples': 1064448, 'steps': 5543, 'loss/train': 2.0214922428131104} +11/06/2021 22:01:58 - INFO - __main__ - Step 5545: {'lr': 0.0004992929193914983, 'samples': 1064640, 'steps': 5544, 'loss/train': 1.7681033611297607} +11/06/2021 22:01:58 - INFO - __main__ - Step 5546: {'lr': 0.0004992925204938498, 'samples': 1064832, 'steps': 5545, 'loss/train': 2.075996160507202} +11/06/2021 22:01:59 - INFO - __main__ - Step 5547: {'lr': 0.0004992921214838738, 'samples': 1065024, 'steps': 5546, 'loss/train': 1.834026575088501} +11/06/2021 22:01:59 - INFO - __main__ - Step 5548: {'lr': 0.0004992917223615706, 'samples': 1065216, 'steps': 5547, 'loss/train': 1.4636272192001343} +11/06/2021 22:01:59 - INFO - __main__ - Step 5549: {'lr': 0.0004992913231269405, 'samples': 1065408, 'steps': 5548, 'loss/train': 1.9245575666427612} +11/06/2021 22:02:00 - INFO - __main__ - Step 5550: {'lr': 0.0004992909237799835, 'samples': 1065600, 'steps': 5549, 'loss/train': 2.2728660106658936} +11/06/2021 22:02:01 - INFO - __main__ - Step 5551: {'lr': 0.0004992905243206999, 'samples': 1065792, 'steps': 5550, 'loss/train': 1.8605475425720215} +11/06/2021 22:02:01 - INFO - __main__ - Step 5552: {'lr': 0.0004992901247490899, 'samples': 1065984, 'steps': 5551, 'loss/train': 2.065237522125244} +11/06/2021 22:02:01 - INFO - __main__ - Step 5553: {'lr': 0.0004992897250651535, 'samples': 1066176, 'steps': 5552, 'loss/train': 2.103445529937744} +11/06/2021 22:02:02 - INFO - __main__ - Step 5554: {'lr': 0.000499289325268891, 'samples': 1066368, 'steps': 5553, 'loss/train': 1.8733552694320679} +11/06/2021 22:02:03 - INFO - __main__ - Step 5555: {'lr': 0.0004992889253603027, 'samples': 1066560, 'steps': 5554, 'loss/train': 1.6204419136047363} +11/06/2021 22:02:03 - INFO - __main__ - Step 5556: {'lr': 0.0004992885253393885, 'samples': 1066752, 'steps': 5555, 'loss/train': 1.7640080451965332} +11/06/2021 22:02:04 - INFO - __main__ - Step 5557: {'lr': 0.0004992881252061489, 'samples': 1066944, 'steps': 5556, 'loss/train': 1.724705457687378} +11/06/2021 22:02:04 - INFO - __main__ - Step 5558: {'lr': 0.0004992877249605838, 'samples': 1067136, 'steps': 5557, 'loss/train': 2.2034895420074463} +11/06/2021 22:02:04 - INFO - __main__ - Step 5559: {'lr': 0.0004992873246026935, 'samples': 1067328, 'steps': 5558, 'loss/train': 2.039024591445923} +11/06/2021 22:02:05 - INFO - __main__ - Step 5560: {'lr': 0.0004992869241324783, 'samples': 1067520, 'steps': 5559, 'loss/train': 1.9477410316467285} +11/06/2021 22:02:06 - INFO - __main__ - Step 5561: {'lr': 0.000499286523549938, 'samples': 1067712, 'steps': 5560, 'loss/train': 1.9774774312973022} +11/06/2021 22:02:06 - INFO - __main__ - Step 5562: {'lr': 0.0004992861228550733, 'samples': 1067904, 'steps': 5561, 'loss/train': 2.137509822845459} +11/06/2021 22:02:06 - INFO - __main__ - Step 5563: {'lr': 0.0004992857220478841, 'samples': 1068096, 'steps': 5562, 'loss/train': 1.9436842203140259} +11/06/2021 22:02:07 - INFO - __main__ - Step 5564: {'lr': 0.0004992853211283705, 'samples': 1068288, 'steps': 5563, 'loss/train': 2.0045459270477295} +11/06/2021 22:02:08 - INFO - __main__ - Step 5565: {'lr': 0.0004992849200965327, 'samples': 1068480, 'steps': 5564, 'loss/train': 1.8353327512741089} +11/06/2021 22:02:08 - INFO - __main__ - Step 5566: {'lr': 0.0004992845189523711, 'samples': 1068672, 'steps': 5565, 'loss/train': 2.0094947814941406} +11/06/2021 22:02:08 - INFO - __main__ - Step 5567: {'lr': 0.0004992841176958858, 'samples': 1068864, 'steps': 5566, 'loss/train': 1.8892325162887573} +11/06/2021 22:02:09 - INFO - __main__ - Step 5568: {'lr': 0.0004992837163270769, 'samples': 1069056, 'steps': 5567, 'loss/train': 1.280644178390503} +11/06/2021 22:02:09 - INFO - __main__ - Step 5569: {'lr': 0.0004992833148459445, 'samples': 1069248, 'steps': 5568, 'loss/train': 2.168335199356079} +11/06/2021 22:02:10 - INFO - __main__ - Step 5570: {'lr': 0.0004992829132524889, 'samples': 1069440, 'steps': 5569, 'loss/train': 1.7364050149917603} +11/06/2021 22:02:11 - INFO - __main__ - Step 5571: {'lr': 0.0004992825115467102, 'samples': 1069632, 'steps': 5570, 'loss/train': 1.8209835290908813} +11/06/2021 22:02:11 - INFO - __main__ - Step 5572: {'lr': 0.0004992821097286088, 'samples': 1069824, 'steps': 5571, 'loss/train': 2.0928235054016113} +11/06/2021 22:02:11 - INFO - __main__ - Step 5573: {'lr': 0.0004992817077981846, 'samples': 1070016, 'steps': 5572, 'loss/train': 1.939453125} +11/06/2021 22:02:12 - INFO - __main__ - Step 5574: {'lr': 0.000499281305755438, 'samples': 1070208, 'steps': 5573, 'loss/train': 1.4345474243164062} +11/06/2021 22:02:13 - INFO - __main__ - Step 5575: {'lr': 0.0004992809036003691, 'samples': 1070400, 'steps': 5574, 'loss/train': 1.5226601362228394} +11/06/2021 22:02:13 - INFO - __main__ - Step 5576: {'lr': 0.000499280501332978, 'samples': 1070592, 'steps': 5575, 'loss/train': 1.6950485706329346} +11/06/2021 22:02:13 - INFO - __main__ - Step 5577: {'lr': 0.000499280098953265, 'samples': 1070784, 'steps': 5576, 'loss/train': 1.7863175868988037} +11/06/2021 22:02:14 - INFO - __main__ - Step 5578: {'lr': 0.0004992796964612302, 'samples': 1070976, 'steps': 5577, 'loss/train': 2.1370227336883545} +11/06/2021 22:02:14 - INFO - __main__ - Step 5579: {'lr': 0.0004992792938568739, 'samples': 1071168, 'steps': 5578, 'loss/train': 1.6954041719436646} +11/06/2021 22:02:15 - INFO - __main__ - Step 5580: {'lr': 0.0004992788911401961, 'samples': 1071360, 'steps': 5579, 'loss/train': 1.965846300125122} +11/06/2021 22:02:15 - INFO - __main__ - Step 5581: {'lr': 0.0004992784883111972, 'samples': 1071552, 'steps': 5580, 'loss/train': 2.0566160678863525} +11/06/2021 22:02:16 - INFO - __main__ - Step 5582: {'lr': 0.0004992780853698771, 'samples': 1071744, 'steps': 5581, 'loss/train': 2.0826704502105713} +11/06/2021 22:02:16 - INFO - __main__ - Step 5583: {'lr': 0.0004992776823162362, 'samples': 1071936, 'steps': 5582, 'loss/train': 1.6253973245620728} +11/06/2021 22:02:16 - INFO - __main__ - Step 5584: {'lr': 0.0004992772791502746, 'samples': 1072128, 'steps': 5583, 'loss/train': 1.7292557954788208} +11/06/2021 22:02:18 - INFO - __main__ - Step 5585: {'lr': 0.0004992768758719926, 'samples': 1072320, 'steps': 5584, 'loss/train': 2.4336965084075928} +11/06/2021 22:02:18 - INFO - __main__ - Step 5586: {'lr': 0.0004992764724813902, 'samples': 1072512, 'steps': 5585, 'loss/train': 1.5816513299942017} +11/06/2021 22:02:18 - INFO - __main__ - Step 5587: {'lr': 0.0004992760689784677, 'samples': 1072704, 'steps': 5586, 'loss/train': 1.2834484577178955} +11/06/2021 22:02:19 - INFO - __main__ - Step 5588: {'lr': 0.0004992756653632252, 'samples': 1072896, 'steps': 5587, 'loss/train': 2.1524899005889893} +11/06/2021 22:02:19 - INFO - __main__ - Step 5589: {'lr': 0.0004992752616356631, 'samples': 1073088, 'steps': 5588, 'loss/train': 2.2790422439575195} +11/06/2021 22:02:19 - INFO - __main__ - Step 5590: {'lr': 0.0004992748577957812, 'samples': 1073280, 'steps': 5589, 'loss/train': 1.7279716730117798} +11/06/2021 22:02:21 - INFO - __main__ - Step 5591: {'lr': 0.00049927445384358, 'samples': 1073472, 'steps': 5590, 'loss/train': 1.8624963760375977} +11/06/2021 22:02:21 - INFO - __main__ - Step 5592: {'lr': 0.0004992740497790595, 'samples': 1073664, 'steps': 5591, 'loss/train': 2.11755108833313} +11/06/2021 22:02:21 - INFO - __main__ - Step 5593: {'lr': 0.0004992736456022201, 'samples': 1073856, 'steps': 5592, 'loss/train': 6.259105205535889} +11/06/2021 22:02:22 - INFO - __main__ - Step 5594: {'lr': 0.0004992732413130617, 'samples': 1074048, 'steps': 5593, 'loss/train': 2.766812562942505} +11/06/2021 22:02:22 - INFO - __main__ - Step 5595: {'lr': 0.0004992728369115848, 'samples': 1074240, 'steps': 5594, 'loss/train': 0.8529731631278992} +11/06/2021 22:02:22 - INFO - __main__ - Step 5596: {'lr': 0.0004992724323977893, 'samples': 1074432, 'steps': 5595, 'loss/train': 1.5423051118850708} +11/06/2021 22:02:23 - INFO - __main__ - Step 5597: {'lr': 0.0004992720277716755, 'samples': 1074624, 'steps': 5596, 'loss/train': 1.7895461320877075} +11/06/2021 22:02:24 - INFO - __main__ - Step 5598: {'lr': 0.0004992716230332435, 'samples': 1074816, 'steps': 5597, 'loss/train': 1.8931951522827148} +11/06/2021 22:02:24 - INFO - __main__ - Step 5599: {'lr': 0.0004992712181824936, 'samples': 1075008, 'steps': 5598, 'loss/train': 2.938845634460449} +11/06/2021 22:02:24 - INFO - __main__ - Step 5600: {'lr': 0.0004992708132194259, 'samples': 1075200, 'steps': 5599, 'loss/train': 1.7190282344818115} +11/06/2021 22:02:25 - INFO - __main__ - Step 5601: {'lr': 0.0004992704081440407, 'samples': 1075392, 'steps': 5600, 'loss/train': 2.1930367946624756} +11/06/2021 22:02:26 - INFO - __main__ - Step 5602: {'lr': 0.0004992700029563381, 'samples': 1075584, 'steps': 5601, 'loss/train': 1.8844269514083862} +11/06/2021 22:02:26 - INFO - __main__ - Step 5603: {'lr': 0.0004992695976563182, 'samples': 1075776, 'steps': 5602, 'loss/train': 2.1230838298797607} +11/06/2021 22:02:26 - INFO - __main__ - Step 5604: {'lr': 0.0004992691922439814, 'samples': 1075968, 'steps': 5603, 'loss/train': 1.6668339967727661} +11/06/2021 22:02:27 - INFO - __main__ - Step 5605: {'lr': 0.0004992687867193277, 'samples': 1076160, 'steps': 5604, 'loss/train': 1.7833575010299683} +11/06/2021 22:02:27 - INFO - __main__ - Step 5606: {'lr': 0.0004992683810823572, 'samples': 1076352, 'steps': 5605, 'loss/train': 1.914794683456421} +11/06/2021 22:02:28 - INFO - __main__ - Step 5607: {'lr': 0.0004992679753330703, 'samples': 1076544, 'steps': 5606, 'loss/train': 1.698716163635254} +11/06/2021 22:02:28 - INFO - __main__ - Step 5608: {'lr': 0.0004992675694714671, 'samples': 1076736, 'steps': 5607, 'loss/train': 2.1556620597839355} +11/06/2021 22:02:29 - INFO - __main__ - Step 5609: {'lr': 0.0004992671634975477, 'samples': 1076928, 'steps': 5608, 'loss/train': 1.4872366189956665} +11/06/2021 22:02:29 - INFO - __main__ - Step 5610: {'lr': 0.0004992667574113125, 'samples': 1077120, 'steps': 5609, 'loss/train': 1.928450345993042} +11/06/2021 22:02:29 - INFO - __main__ - Step 5611: {'lr': 0.0004992663512127615, 'samples': 1077312, 'steps': 5610, 'loss/train': 2.2512283325195312} +11/06/2021 22:02:31 - INFO - __main__ - Step 5612: {'lr': 0.0004992659449018949, 'samples': 1077504, 'steps': 5611, 'loss/train': 1.50386643409729} +11/06/2021 22:02:31 - INFO - __main__ - Step 5613: {'lr': 0.0004992655384787129, 'samples': 1077696, 'steps': 5612, 'loss/train': 2.3416426181793213} +11/06/2021 22:02:31 - INFO - __main__ - Step 5614: {'lr': 0.0004992651319432157, 'samples': 1077888, 'steps': 5613, 'loss/train': 2.967033863067627} +11/06/2021 22:02:32 - INFO - __main__ - Step 5615: {'lr': 0.0004992647252954035, 'samples': 1078080, 'steps': 5614, 'loss/train': 2.203519582748413} +11/06/2021 22:02:32 - INFO - __main__ - Step 5616: {'lr': 0.0004992643185352765, 'samples': 1078272, 'steps': 5615, 'loss/train': 2.0697097778320312} +11/06/2021 22:02:32 - INFO - __main__ - Step 5617: {'lr': 0.0004992639116628349, 'samples': 1078464, 'steps': 5616, 'loss/train': 2.1669209003448486} +11/06/2021 22:02:34 - INFO - __main__ - Step 5618: {'lr': 0.0004992635046780786, 'samples': 1078656, 'steps': 5617, 'loss/train': 2.434951066970825} +11/06/2021 22:02:34 - INFO - __main__ - Step 5619: {'lr': 0.0004992630975810083, 'samples': 1078848, 'steps': 5618, 'loss/train': 2.055948257446289} +11/06/2021 22:02:35 - INFO - __main__ - Step 5620: {'lr': 0.0004992626903716237, 'samples': 1079040, 'steps': 5619, 'loss/train': 0.3906489312648773} +11/06/2021 22:02:35 - INFO - __main__ - Step 5621: {'lr': 0.0004992622830499252, 'samples': 1079232, 'steps': 5620, 'loss/train': 0.3192686438560486} +11/06/2021 22:02:35 - INFO - __main__ - Step 5622: {'lr': 0.000499261875615913, 'samples': 1079424, 'steps': 5621, 'loss/train': 1.627442479133606} +11/06/2021 22:02:36 - INFO - __main__ - Step 5623: {'lr': 0.0004992614680695872, 'samples': 1079616, 'steps': 5622, 'loss/train': 2.138500452041626} +11/06/2021 22:02:37 - INFO - __main__ - Step 5624: {'lr': 0.0004992610604109481, 'samples': 1079808, 'steps': 5623, 'loss/train': 2.165574312210083} +11/06/2021 22:02:37 - INFO - __main__ - Step 5625: {'lr': 0.0004992606526399957, 'samples': 1080000, 'steps': 5624, 'loss/train': 1.8479472398757935} +11/06/2021 22:02:37 - INFO - __main__ - Step 5626: {'lr': 0.0004992602447567304, 'samples': 1080192, 'steps': 5625, 'loss/train': 2.4740467071533203} +11/06/2021 22:02:38 - INFO - __main__ - Step 5627: {'lr': 0.0004992598367611523, 'samples': 1080384, 'steps': 5626, 'loss/train': 1.5033149719238281} +11/06/2021 22:02:38 - INFO - __main__ - Step 5628: {'lr': 0.0004992594286532615, 'samples': 1080576, 'steps': 5627, 'loss/train': 1.958828330039978} +11/06/2021 22:02:39 - INFO - __main__ - Step 5629: {'lr': 0.0004992590204330583, 'samples': 1080768, 'steps': 5628, 'loss/train': 1.696641445159912} +11/06/2021 22:02:39 - INFO - __main__ - Step 5630: {'lr': 0.0004992586121005427, 'samples': 1080960, 'steps': 5629, 'loss/train': 0.8877306580543518} +11/06/2021 22:02:40 - INFO - __main__ - Step 5631: {'lr': 0.0004992582036557152, 'samples': 1081152, 'steps': 5630, 'loss/train': 2.333393096923828} +11/06/2021 22:02:40 - INFO - __main__ - Step 5632: {'lr': 0.0004992577950985757, 'samples': 1081344, 'steps': 5631, 'loss/train': 2.0259532928466797} +11/06/2021 22:02:40 - INFO - __main__ - Step 5633: {'lr': 0.0004992573864291244, 'samples': 1081536, 'steps': 5632, 'loss/train': 1.8936342000961304} +11/06/2021 22:02:41 - INFO - __main__ - Step 5634: {'lr': 0.0004992569776473616, 'samples': 1081728, 'steps': 5633, 'loss/train': 1.8749663829803467} +11/06/2021 22:02:42 - INFO - __main__ - Step 5635: {'lr': 0.0004992565687532875, 'samples': 1081920, 'steps': 5634, 'loss/train': 1.5571837425231934} +11/06/2021 22:02:42 - INFO - __main__ - Step 5636: {'lr': 0.0004992561597469023, 'samples': 1082112, 'steps': 5635, 'loss/train': 2.0260841846466064} +11/06/2021 22:02:42 - INFO - __main__ - Step 5637: {'lr': 0.0004992557506282061, 'samples': 1082304, 'steps': 5636, 'loss/train': 1.9845712184906006} +11/06/2021 22:02:43 - INFO - __main__ - Step 5638: {'lr': 0.0004992553413971991, 'samples': 1082496, 'steps': 5637, 'loss/train': 1.8022942543029785} +11/06/2021 22:02:44 - INFO - __main__ - Step 5639: {'lr': 0.0004992549320538814, 'samples': 1082688, 'steps': 5638, 'loss/train': 2.3104302883148193} +11/06/2021 22:02:44 - INFO - __main__ - Step 5640: {'lr': 0.0004992545225982533, 'samples': 1082880, 'steps': 5639, 'loss/train': 1.7610740661621094} +11/06/2021 22:02:45 - INFO - __main__ - Step 5641: {'lr': 0.000499254113030315, 'samples': 1083072, 'steps': 5640, 'loss/train': 1.8128447532653809} +11/06/2021 22:02:45 - INFO - __main__ - Step 5642: {'lr': 0.0004992537033500667, 'samples': 1083264, 'steps': 5641, 'loss/train': 1.8965189456939697} +11/06/2021 22:02:45 - INFO - __main__ - Step 5643: {'lr': 0.0004992532935575084, 'samples': 1083456, 'steps': 5642, 'loss/train': 2.2873661518096924} +11/06/2021 22:02:46 - INFO - __main__ - Step 5644: {'lr': 0.0004992528836526405, 'samples': 1083648, 'steps': 5643, 'loss/train': 2.314706325531006} +11/06/2021 22:02:47 - INFO - __main__ - Step 5645: {'lr': 0.0004992524736354631, 'samples': 1083840, 'steps': 5644, 'loss/train': 2.096315622329712} +11/06/2021 22:02:47 - INFO - __main__ - Step 5646: {'lr': 0.0004992520635059762, 'samples': 1084032, 'steps': 5645, 'loss/train': 1.736008644104004} +11/06/2021 22:02:47 - INFO - __main__ - Step 5647: {'lr': 0.0004992516532641804, 'samples': 1084224, 'steps': 5646, 'loss/train': 1.71793794631958} +11/06/2021 22:02:48 - INFO - __main__ - Step 5648: {'lr': 0.0004992512429100757, 'samples': 1084416, 'steps': 5647, 'loss/train': 1.7612890005111694} +11/06/2021 22:02:49 - INFO - __main__ - Step 5649: {'lr': 0.000499250832443662, 'samples': 1084608, 'steps': 5648, 'loss/train': 2.2662413120269775} +11/06/2021 22:02:49 - INFO - __main__ - Step 5650: {'lr': 0.0004992504218649398, 'samples': 1084800, 'steps': 5649, 'loss/train': 1.443153977394104} +11/06/2021 22:02:50 - INFO - __main__ - Step 5651: {'lr': 0.0004992500111739093, 'samples': 1084992, 'steps': 5650, 'loss/train': 2.055508852005005} +11/06/2021 22:02:50 - INFO - __main__ - Step 5652: {'lr': 0.0004992496003705705, 'samples': 1085184, 'steps': 5651, 'loss/train': 2.131808042526245} +11/06/2021 22:02:50 - INFO - __main__ - Step 5653: {'lr': 0.0004992491894549236, 'samples': 1085376, 'steps': 5652, 'loss/train': 1.7326874732971191} +11/06/2021 22:02:51 - INFO - __main__ - Step 5654: {'lr': 0.000499248778426969, 'samples': 1085568, 'steps': 5653, 'loss/train': 2.14742374420166} +11/06/2021 22:02:52 - INFO - __main__ - Step 5655: {'lr': 0.0004992483672867068, 'samples': 1085760, 'steps': 5654, 'loss/train': 1.887015461921692} +11/06/2021 22:02:52 - INFO - __main__ - Step 5656: {'lr': 0.000499247956034137, 'samples': 1085952, 'steps': 5655, 'loss/train': 0.4538571536540985} +11/06/2021 22:02:52 - INFO - __main__ - Step 5657: {'lr': 0.00049924754466926, 'samples': 1086144, 'steps': 5656, 'loss/train': 2.187472105026245} +11/06/2021 22:02:53 - INFO - __main__ - Step 5658: {'lr': 0.0004992471331920758, 'samples': 1086336, 'steps': 5657, 'loss/train': 1.9629387855529785} +11/06/2021 22:02:53 - INFO - __main__ - Step 5659: {'lr': 0.0004992467216025848, 'samples': 1086528, 'steps': 5658, 'loss/train': 2.4174067974090576} +11/06/2021 22:02:54 - INFO - __main__ - Step 5660: {'lr': 0.0004992463099007871, 'samples': 1086720, 'steps': 5659, 'loss/train': 1.6454474925994873} +11/06/2021 22:02:54 - INFO - __main__ - Step 5661: {'lr': 0.0004992458980866827, 'samples': 1086912, 'steps': 5660, 'loss/train': 1.8920400142669678} +11/06/2021 22:02:55 - INFO - __main__ - Step 5662: {'lr': 0.000499245486160272, 'samples': 1087104, 'steps': 5661, 'loss/train': 1.9282915592193604} +11/06/2021 22:02:55 - INFO - __main__ - Step 5663: {'lr': 0.0004992450741215552, 'samples': 1087296, 'steps': 5662, 'loss/train': 1.9078826904296875} +11/06/2021 22:02:55 - INFO - __main__ - Step 5664: {'lr': 0.0004992446619705324, 'samples': 1087488, 'steps': 5663, 'loss/train': 1.9330226182937622} +11/06/2021 22:02:56 - INFO - __main__ - Step 5665: {'lr': 0.0004992442497072037, 'samples': 1087680, 'steps': 5664, 'loss/train': 1.8962855339050293} +11/06/2021 22:02:57 - INFO - __main__ - Step 5666: {'lr': 0.0004992438373315694, 'samples': 1087872, 'steps': 5665, 'loss/train': 1.5366052389144897} +11/06/2021 22:02:57 - INFO - __main__ - Step 5667: {'lr': 0.0004992434248436298, 'samples': 1088064, 'steps': 5666, 'loss/train': 1.221272587776184} +11/06/2021 22:02:57 - INFO - __main__ - Step 5668: {'lr': 0.0004992430122433848, 'samples': 1088256, 'steps': 5667, 'loss/train': 1.9391791820526123} +11/06/2021 22:02:58 - INFO - __main__ - Step 5669: {'lr': 0.0004992425995308349, 'samples': 1088448, 'steps': 5668, 'loss/train': 1.7548898458480835} +11/06/2021 22:02:59 - INFO - __main__ - Step 5670: {'lr': 0.0004992421867059801, 'samples': 1088640, 'steps': 5669, 'loss/train': 1.8856055736541748} +11/06/2021 22:02:59 - INFO - __main__ - Step 5671: {'lr': 0.0004992417737688206, 'samples': 1088832, 'steps': 5670, 'loss/train': 1.850290298461914} +11/06/2021 22:02:59 - INFO - __main__ - Step 5672: {'lr': 0.0004992413607193566, 'samples': 1089024, 'steps': 5671, 'loss/train': 2.0641515254974365} +11/06/2021 22:03:00 - INFO - __main__ - Step 5673: {'lr': 0.0004992409475575882, 'samples': 1089216, 'steps': 5672, 'loss/train': 2.626786231994629} +11/06/2021 22:03:00 - INFO - __main__ - Step 5674: {'lr': 0.0004992405342835158, 'samples': 1089408, 'steps': 5673, 'loss/train': 1.913179636001587} +11/06/2021 22:03:01 - INFO - __main__ - Step 5675: {'lr': 0.0004992401208971394, 'samples': 1089600, 'steps': 5674, 'loss/train': 2.4290151596069336} +11/06/2021 22:03:02 - INFO - __main__ - Step 5676: {'lr': 0.0004992397073984592, 'samples': 1089792, 'steps': 5675, 'loss/train': 1.8842289447784424} +11/06/2021 22:03:02 - INFO - __main__ - Step 5677: {'lr': 0.0004992392937874755, 'samples': 1089984, 'steps': 5676, 'loss/train': 1.9053252935409546} +11/06/2021 22:03:02 - INFO - __main__ - Step 5678: {'lr': 0.0004992388800641885, 'samples': 1090176, 'steps': 5677, 'loss/train': 2.1851115226745605} +11/06/2021 22:03:03 - INFO - __main__ - Step 5679: {'lr': 0.0004992384662285981, 'samples': 1090368, 'steps': 5678, 'loss/train': 1.9551331996917725} +11/06/2021 22:03:04 - INFO - __main__ - Step 5680: {'lr': 0.0004992380522807049, 'samples': 1090560, 'steps': 5679, 'loss/train': 2.1385090351104736} +11/06/2021 22:03:04 - INFO - __main__ - Step 5681: {'lr': 0.0004992376382205088, 'samples': 1090752, 'steps': 5680, 'loss/train': 0.955967903137207} +11/06/2021 22:03:04 - INFO - __main__ - Step 5682: {'lr': 0.00049923722404801, 'samples': 1090944, 'steps': 5681, 'loss/train': 1.333667278289795} +11/06/2021 22:03:05 - INFO - __main__ - Step 5683: {'lr': 0.0004992368097632089, 'samples': 1091136, 'steps': 5682, 'loss/train': 2.1074047088623047} +11/06/2021 22:03:05 - INFO - __main__ - Step 5684: {'lr': 0.0004992363953661054, 'samples': 1091328, 'steps': 5683, 'loss/train': 1.597164273262024} +11/06/2021 22:03:06 - INFO - __main__ - Step 5685: {'lr': 0.0004992359808566999, 'samples': 1091520, 'steps': 5684, 'loss/train': 4.272282600402832} +11/06/2021 22:03:06 - INFO - __main__ - Step 5686: {'lr': 0.0004992355662349925, 'samples': 1091712, 'steps': 5685, 'loss/train': 2.0851457118988037} +11/06/2021 22:03:07 - INFO - __main__ - Step 5687: {'lr': 0.0004992351515009833, 'samples': 1091904, 'steps': 5686, 'loss/train': 1.8593014478683472} +11/06/2021 22:03:07 - INFO - __main__ - Step 5688: {'lr': 0.0004992347366546727, 'samples': 1092096, 'steps': 5687, 'loss/train': 2.107888698577881} +11/06/2021 22:03:07 - INFO - __main__ - Step 5689: {'lr': 0.0004992343216960607, 'samples': 1092288, 'steps': 5688, 'loss/train': 1.92064368724823} +11/06/2021 22:03:09 - INFO - __main__ - Step 5690: {'lr': 0.0004992339066251476, 'samples': 1092480, 'steps': 5689, 'loss/train': 1.6505532264709473} +11/06/2021 22:03:09 - INFO - __main__ - Step 5691: {'lr': 0.0004992334914419337, 'samples': 1092672, 'steps': 5690, 'loss/train': 1.4800523519515991} +11/06/2021 22:03:09 - INFO - __main__ - Step 5692: {'lr': 0.0004992330761464188, 'samples': 1092864, 'steps': 5691, 'loss/train': 1.566269874572754} +11/06/2021 22:03:10 - INFO - __main__ - Step 5693: {'lr': 0.0004992326607386034, 'samples': 1093056, 'steps': 5692, 'loss/train': 2.7816977500915527} +11/06/2021 22:03:10 - INFO - __main__ - Step 5694: {'lr': 0.0004992322452184876, 'samples': 1093248, 'steps': 5693, 'loss/train': 2.2784321308135986} +11/06/2021 22:03:10 - INFO - __main__ - Step 5695: {'lr': 0.0004992318295860718, 'samples': 1093440, 'steps': 5694, 'loss/train': 1.6132631301879883} +11/06/2021 22:03:11 - INFO - __main__ - Step 5696: {'lr': 0.0004992314138413557, 'samples': 1093632, 'steps': 5695, 'loss/train': 1.0506314039230347} +11/06/2021 22:03:12 - INFO - __main__ - Step 5697: {'lr': 0.0004992309979843398, 'samples': 1093824, 'steps': 5696, 'loss/train': 1.6640676259994507} +11/06/2021 22:03:12 - INFO - __main__ - Step 5698: {'lr': 0.0004992305820150243, 'samples': 1094016, 'steps': 5697, 'loss/train': 2.264589548110962} +11/06/2021 22:03:12 - INFO - __main__ - Step 5699: {'lr': 0.0004992301659334095, 'samples': 1094208, 'steps': 5698, 'loss/train': 1.779240369796753} +11/06/2021 22:03:13 - INFO - __main__ - Step 5700: {'lr': 0.0004992297497394953, 'samples': 1094400, 'steps': 5699, 'loss/train': 1.5789347887039185} +11/06/2021 22:03:14 - INFO - __main__ - Step 5701: {'lr': 0.000499229333433282, 'samples': 1094592, 'steps': 5700, 'loss/train': 1.8561713695526123} +11/06/2021 22:03:14 - INFO - __main__ - Step 5702: {'lr': 0.0004992289170147699, 'samples': 1094784, 'steps': 5701, 'loss/train': 2.206258535385132} +11/06/2021 22:03:15 - INFO - __main__ - Step 5703: {'lr': 0.000499228500483959, 'samples': 1094976, 'steps': 5702, 'loss/train': 1.1616374254226685} +11/06/2021 22:03:15 - INFO - __main__ - Step 5704: {'lr': 0.0004992280838408496, 'samples': 1095168, 'steps': 5703, 'loss/train': 2.011932611465454} +11/06/2021 22:03:15 - INFO - __main__ - Step 5705: {'lr': 0.0004992276670854419, 'samples': 1095360, 'steps': 5704, 'loss/train': 2.265223503112793} +11/06/2021 22:03:16 - INFO - __main__ - Step 5706: {'lr': 0.000499227250217736, 'samples': 1095552, 'steps': 5705, 'loss/train': 1.879677414894104} +11/06/2021 22:03:17 - INFO - __main__ - Step 5707: {'lr': 0.0004992268332377323, 'samples': 1095744, 'steps': 5706, 'loss/train': 1.6559354066848755} +11/06/2021 22:03:17 - INFO - __main__ - Step 5708: {'lr': 0.0004992264161454306, 'samples': 1095936, 'steps': 5707, 'loss/train': 2.132072925567627} +11/06/2021 22:03:17 - INFO - __main__ - Step 5709: {'lr': 0.0004992259989408316, 'samples': 1096128, 'steps': 5708, 'loss/train': 3.037383556365967} +11/06/2021 22:03:18 - INFO - __main__ - Step 5710: {'lr': 0.000499225581623935, 'samples': 1096320, 'steps': 5709, 'loss/train': 2.0813891887664795} +11/06/2021 22:03:18 - INFO - __main__ - Step 5711: {'lr': 0.0004992251641947412, 'samples': 1096512, 'steps': 5710, 'loss/train': 1.6070504188537598} +11/06/2021 22:03:19 - INFO - __main__ - Step 5712: {'lr': 0.0004992247466532504, 'samples': 1096704, 'steps': 5711, 'loss/train': 1.8336153030395508} +11/06/2021 22:03:20 - INFO - __main__ - Step 5713: {'lr': 0.0004992243289994629, 'samples': 1096896, 'steps': 5712, 'loss/train': 1.5240449905395508} +11/06/2021 22:03:20 - INFO - __main__ - Step 5714: {'lr': 0.0004992239112333787, 'samples': 1097088, 'steps': 5713, 'loss/train': 2.0184898376464844} +11/06/2021 22:03:20 - INFO - __main__ - Step 5715: {'lr': 0.000499223493354998, 'samples': 1097280, 'steps': 5714, 'loss/train': 1.668257713317871} +11/06/2021 22:03:21 - INFO - __main__ - Step 5716: {'lr': 0.0004992230753643211, 'samples': 1097472, 'steps': 5715, 'loss/train': 2.1014792919158936} +11/06/2021 22:03:22 - INFO - __main__ - Step 5717: {'lr': 0.0004992226572613481, 'samples': 1097664, 'steps': 5716, 'loss/train': 2.5767147541046143} +11/06/2021 22:03:22 - INFO - __main__ - Step 5718: {'lr': 0.0004992222390460792, 'samples': 1097856, 'steps': 5717, 'loss/train': 1.6296945810317993} +11/06/2021 22:03:23 - INFO - __main__ - Step 5719: {'lr': 0.0004992218207185146, 'samples': 1098048, 'steps': 5718, 'loss/train': 1.9573607444763184} +11/06/2021 22:03:23 - INFO - __main__ - Step 5720: {'lr': 0.0004992214022786546, 'samples': 1098240, 'steps': 5719, 'loss/train': 2.1646392345428467} +11/06/2021 22:03:23 - INFO - __main__ - Step 5721: {'lr': 0.0004992209837264991, 'samples': 1098432, 'steps': 5720, 'loss/train': 1.7333484888076782} +11/06/2021 22:03:24 - INFO - __main__ - Step 5722: {'lr': 0.0004992205650620487, 'samples': 1098624, 'steps': 5721, 'loss/train': 0.6370934844017029} +11/06/2021 22:03:25 - INFO - __main__ - Step 5723: {'lr': 0.0004992201462853032, 'samples': 1098816, 'steps': 5722, 'loss/train': 1.629151701927185} +11/06/2021 22:03:25 - INFO - __main__ - Step 5724: {'lr': 0.000499219727396263, 'samples': 1099008, 'steps': 5723, 'loss/train': 1.9365618228912354} +11/06/2021 22:03:25 - INFO - __main__ - Step 5725: {'lr': 0.0004992193083949282, 'samples': 1099200, 'steps': 5724, 'loss/train': 1.9601372480392456} +11/06/2021 22:03:26 - INFO - __main__ - Step 5726: {'lr': 0.000499218889281299, 'samples': 1099392, 'steps': 5725, 'loss/train': 2.3020355701446533} +11/06/2021 22:03:27 - INFO - __main__ - Step 5727: {'lr': 0.0004992184700553756, 'samples': 1099584, 'steps': 5726, 'loss/train': 1.6674587726593018} +11/06/2021 22:03:27 - INFO - __main__ - Step 5728: {'lr': 0.0004992180507171583, 'samples': 1099776, 'steps': 5727, 'loss/train': 1.6533688306808472} +11/06/2021 22:03:28 - INFO - __main__ - Step 5729: {'lr': 0.0004992176312666472, 'samples': 1099968, 'steps': 5728, 'loss/train': 2.2179229259490967} +11/06/2021 22:03:28 - INFO - __main__ - Step 5730: {'lr': 0.0004992172117038424, 'samples': 1100160, 'steps': 5729, 'loss/train': 1.1370854377746582} +11/06/2021 22:03:28 - INFO - __main__ - Step 5731: {'lr': 0.0004992167920287443, 'samples': 1100352, 'steps': 5730, 'loss/train': 1.7039726972579956} +11/06/2021 22:03:29 - INFO - __main__ - Step 5732: {'lr': 0.0004992163722413528, 'samples': 1100544, 'steps': 5731, 'loss/train': 1.9213690757751465} +11/06/2021 22:03:30 - INFO - __main__ - Step 5733: {'lr': 0.0004992159523416683, 'samples': 1100736, 'steps': 5732, 'loss/train': 1.352500081062317} +11/06/2021 22:03:30 - INFO - __main__ - Step 5734: {'lr': 0.000499215532329691, 'samples': 1100928, 'steps': 5733, 'loss/train': 2.3343346118927} +11/06/2021 22:03:30 - INFO - __main__ - Step 5735: {'lr': 0.000499215112205421, 'samples': 1101120, 'steps': 5734, 'loss/train': 2.6258137226104736} +11/06/2021 22:03:31 - INFO - __main__ - Step 5736: {'lr': 0.0004992146919688584, 'samples': 1101312, 'steps': 5735, 'loss/train': 2.2007718086242676} +11/06/2021 22:03:31 - INFO - __main__ - Step 5737: {'lr': 0.0004992142716200036, 'samples': 1101504, 'steps': 5736, 'loss/train': 1.8303169012069702} +11/06/2021 22:03:32 - INFO - __main__ - Step 5738: {'lr': 0.0004992138511588567, 'samples': 1101696, 'steps': 5737, 'loss/train': 1.5697263479232788} +11/06/2021 22:03:33 - INFO - __main__ - Step 5739: {'lr': 0.0004992134305854179, 'samples': 1101888, 'steps': 5738, 'loss/train': 1.949165940284729} +11/06/2021 22:03:33 - INFO - __main__ - Step 5740: {'lr': 0.0004992130098996873, 'samples': 1102080, 'steps': 5739, 'loss/train': 2.357881784439087} +11/06/2021 22:03:33 - INFO - __main__ - Step 5741: {'lr': 0.0004992125891016652, 'samples': 1102272, 'steps': 5740, 'loss/train': 2.1080918312072754} +11/06/2021 22:03:34 - INFO - __main__ - Step 5742: {'lr': 0.0004992121681913518, 'samples': 1102464, 'steps': 5741, 'loss/train': 1.897286295890808} +11/06/2021 22:03:35 - INFO - __main__ - Step 5743: {'lr': 0.0004992117471687472, 'samples': 1102656, 'steps': 5742, 'loss/train': 1.7857768535614014} +11/06/2021 22:03:35 - INFO - __main__ - Step 5744: {'lr': 0.0004992113260338517, 'samples': 1102848, 'steps': 5743, 'loss/train': 1.731091022491455} +11/06/2021 22:03:36 - INFO - __main__ - Step 5745: {'lr': 0.0004992109047866653, 'samples': 1103040, 'steps': 5744, 'loss/train': 0.806926429271698} +11/06/2021 22:03:36 - INFO - __main__ - Step 5746: {'lr': 0.0004992104834271884, 'samples': 1103232, 'steps': 5745, 'loss/train': 1.5223336219787598} +11/06/2021 22:03:36 - INFO - __main__ - Step 5747: {'lr': 0.0004992100619554211, 'samples': 1103424, 'steps': 5746, 'loss/train': 0.8918942809104919} +11/06/2021 22:03:37 - INFO - __main__ - Step 5748: {'lr': 0.0004992096403713635, 'samples': 1103616, 'steps': 5747, 'loss/train': 2.426661491394043} +11/06/2021 22:03:38 - INFO - __main__ - Step 5749: {'lr': 0.000499209218675016, 'samples': 1103808, 'steps': 5748, 'loss/train': 1.9452520608901978} +11/06/2021 22:03:38 - INFO - __main__ - Step 5750: {'lr': 0.0004992087968663786, 'samples': 1104000, 'steps': 5749, 'loss/train': 2.1779873371124268} +11/06/2021 22:03:38 - INFO - __main__ - Step 5751: {'lr': 0.0004992083749454515, 'samples': 1104192, 'steps': 5750, 'loss/train': 2.161979913711548} +11/06/2021 22:03:39 - INFO - __main__ - Step 5752: {'lr': 0.0004992079529122351, 'samples': 1104384, 'steps': 5751, 'loss/train': 2.0824427604675293} +11/06/2021 22:03:39 - INFO - __main__ - Step 5753: {'lr': 0.0004992075307667294, 'samples': 1104576, 'steps': 5752, 'loss/train': 1.917615532875061} +11/06/2021 22:03:40 - INFO - __main__ - Step 5754: {'lr': 0.0004992071085089346, 'samples': 1104768, 'steps': 5753, 'loss/train': 1.9957177639007568} +11/06/2021 22:03:40 - INFO - __main__ - Step 5755: {'lr': 0.0004992066861388509, 'samples': 1104960, 'steps': 5754, 'loss/train': 2.4890198707580566} +11/06/2021 22:03:41 - INFO - __main__ - Step 5756: {'lr': 0.0004992062636564786, 'samples': 1105152, 'steps': 5755, 'loss/train': 2.0366508960723877} +11/06/2021 22:03:41 - INFO - __main__ - Step 5757: {'lr': 0.0004992058410618177, 'samples': 1105344, 'steps': 5756, 'loss/train': 1.8771767616271973} +11/06/2021 22:03:41 - INFO - __main__ - Step 5758: {'lr': 0.0004992054183548685, 'samples': 1105536, 'steps': 5757, 'loss/train': 1.831110954284668} +11/06/2021 22:03:42 - INFO - __main__ - Step 5759: {'lr': 0.0004992049955356313, 'samples': 1105728, 'steps': 5758, 'loss/train': 1.9998888969421387} +11/06/2021 22:03:43 - INFO - __main__ - Step 5760: {'lr': 0.0004992045726041061, 'samples': 1105920, 'steps': 5759, 'loss/train': 1.6390290260314941} +11/06/2021 22:03:43 - INFO - __main__ - Step 5761: {'lr': 0.0004992041495602931, 'samples': 1106112, 'steps': 5760, 'loss/train': 1.8871279954910278} +11/06/2021 22:03:43 - INFO - __main__ - Step 5762: {'lr': 0.0004992037264041927, 'samples': 1106304, 'steps': 5761, 'loss/train': 2.7481179237365723} +11/06/2021 22:03:44 - INFO - __main__ - Step 5763: {'lr': 0.0004992033031358048, 'samples': 1106496, 'steps': 5762, 'loss/train': 2.292053699493408} +11/06/2021 22:03:45 - INFO - __main__ - Step 5764: {'lr': 0.0004992028797551298, 'samples': 1106688, 'steps': 5763, 'loss/train': 1.911152720451355} +11/06/2021 22:03:45 - INFO - __main__ - Step 5765: {'lr': 0.0004992024562621678, 'samples': 1106880, 'steps': 5764, 'loss/train': 2.004040479660034} +11/06/2021 22:03:46 - INFO - __main__ - Step 5766: {'lr': 0.0004992020326569191, 'samples': 1107072, 'steps': 5765, 'loss/train': 2.0469226837158203} +11/06/2021 22:03:46 - INFO - __main__ - Step 5767: {'lr': 0.0004992016089393837, 'samples': 1107264, 'steps': 5766, 'loss/train': 1.93135666847229} +11/06/2021 22:03:46 - INFO - __main__ - Step 5768: {'lr': 0.000499201185109562, 'samples': 1107456, 'steps': 5767, 'loss/train': 2.3704495429992676} +11/06/2021 22:03:47 - INFO - __main__ - Step 5769: {'lr': 0.000499200761167454, 'samples': 1107648, 'steps': 5768, 'loss/train': 1.7773163318634033} +11/06/2021 22:03:48 - INFO - __main__ - Step 5770: {'lr': 0.0004992003371130601, 'samples': 1107840, 'steps': 5769, 'loss/train': 1.401180386543274} +11/06/2021 22:03:48 - INFO - __main__ - Step 5771: {'lr': 0.0004991999129463803, 'samples': 1108032, 'steps': 5770, 'loss/train': 2.0761475563049316} +11/06/2021 22:03:48 - INFO - __main__ - Step 5772: {'lr': 0.0004991994886674148, 'samples': 1108224, 'steps': 5771, 'loss/train': 2.294243574142456} +11/06/2021 22:03:49 - INFO - __main__ - Step 5773: {'lr': 0.000499199064276164, 'samples': 1108416, 'steps': 5772, 'loss/train': 2.8149049282073975} +11/06/2021 22:03:50 - INFO - __main__ - Step 5774: {'lr': 0.0004991986397726278, 'samples': 1108608, 'steps': 5773, 'loss/train': 1.9633965492248535} +11/06/2021 22:03:50 - INFO - __main__ - Step 5775: {'lr': 0.0004991982151568066, 'samples': 1108800, 'steps': 5774, 'loss/train': 2.1700239181518555} +11/06/2021 22:03:50 - INFO - __main__ - Step 5776: {'lr': 0.0004991977904287006, 'samples': 1108992, 'steps': 5775, 'loss/train': 1.5528236627578735} +11/06/2021 22:03:51 - INFO - __main__ - Step 5777: {'lr': 0.0004991973655883099, 'samples': 1109184, 'steps': 5776, 'loss/train': 1.8211041688919067} +11/06/2021 22:03:51 - INFO - __main__ - Step 5778: {'lr': 0.0004991969406356346, 'samples': 1109376, 'steps': 5777, 'loss/train': 2.413984775543213} +11/06/2021 22:03:51 - INFO - __main__ - Step 5779: {'lr': 0.0004991965155706752, 'samples': 1109568, 'steps': 5778, 'loss/train': 1.5177364349365234} +11/06/2021 22:03:52 - INFO - __main__ - Step 5780: {'lr': 0.0004991960903934315, 'samples': 1109760, 'steps': 5779, 'loss/train': 1.6337430477142334} +11/06/2021 22:03:53 - INFO - __main__ - Step 5781: {'lr': 0.0004991956651039039, 'samples': 1109952, 'steps': 5780, 'loss/train': 1.6799068450927734} +11/06/2021 22:03:53 - INFO - __main__ - Step 5782: {'lr': 0.0004991952397020927, 'samples': 1110144, 'steps': 5781, 'loss/train': 1.9769641160964966} +11/06/2021 22:03:54 - INFO - __main__ - Step 5783: {'lr': 0.0004991948141879978, 'samples': 1110336, 'steps': 5782, 'loss/train': 1.8195029497146606} +11/06/2021 22:03:54 - INFO - __main__ - Step 5784: {'lr': 0.0004991943885616198, 'samples': 1110528, 'steps': 5783, 'loss/train': 1.771957516670227} +11/06/2021 22:03:55 - INFO - __main__ - Step 5785: {'lr': 0.0004991939628229585, 'samples': 1110720, 'steps': 5784, 'loss/train': 1.7779532670974731} +11/06/2021 22:03:55 - INFO - __main__ - Step 5786: {'lr': 0.0004991935369720143, 'samples': 1110912, 'steps': 5785, 'loss/train': 2.5987279415130615} +11/06/2021 22:03:56 - INFO - __main__ - Step 5787: {'lr': 0.0004991931110087873, 'samples': 1111104, 'steps': 5786, 'loss/train': 2.056739568710327} +11/06/2021 22:03:56 - INFO - __main__ - Step 5788: {'lr': 0.0004991926849332777, 'samples': 1111296, 'steps': 5787, 'loss/train': 2.098029851913452} +11/06/2021 22:03:56 - INFO - __main__ - Step 5789: {'lr': 0.0004991922587454858, 'samples': 1111488, 'steps': 5788, 'loss/train': 1.8450032472610474} +11/06/2021 22:03:57 - INFO - __main__ - Step 5790: {'lr': 0.0004991918324454117, 'samples': 1111680, 'steps': 5789, 'loss/train': 1.8697025775909424} +11/06/2021 22:03:58 - INFO - __main__ - Step 5791: {'lr': 0.0004991914060330556, 'samples': 1111872, 'steps': 5790, 'loss/train': 2.107398271560669} +11/06/2021 22:03:58 - INFO - __main__ - Step 5792: {'lr': 0.0004991909795084177, 'samples': 1112064, 'steps': 5791, 'loss/train': 1.6011704206466675} +11/06/2021 22:03:58 - INFO - __main__ - Step 5793: {'lr': 0.0004991905528714981, 'samples': 1112256, 'steps': 5792, 'loss/train': 1.8442002534866333} +11/06/2021 22:03:59 - INFO - __main__ - Step 5794: {'lr': 0.0004991901261222971, 'samples': 1112448, 'steps': 5793, 'loss/train': 2.1112143993377686} +11/06/2021 22:04:00 - INFO - __main__ - Step 5795: {'lr': 0.000499189699260815, 'samples': 1112640, 'steps': 5794, 'loss/train': 1.3628276586532593} +11/06/2021 22:04:00 - INFO - __main__ - Step 5796: {'lr': 0.0004991892722870517, 'samples': 1112832, 'steps': 5795, 'loss/train': 1.7392164468765259} +11/06/2021 22:04:00 - INFO - __main__ - Step 5797: {'lr': 0.0004991888452010076, 'samples': 1113024, 'steps': 5796, 'loss/train': 2.1500654220581055} +11/06/2021 22:04:01 - INFO - __main__ - Step 5798: {'lr': 0.000499188418002683, 'samples': 1113216, 'steps': 5797, 'loss/train': 2.0395941734313965} +11/06/2021 22:04:01 - INFO - __main__ - Step 5799: {'lr': 0.0004991879906920779, 'samples': 1113408, 'steps': 5798, 'loss/train': 1.4463250637054443} +11/06/2021 22:04:02 - INFO - __main__ - Step 5800: {'lr': 0.0004991875632691924, 'samples': 1113600, 'steps': 5799, 'loss/train': 2.434201717376709} +11/06/2021 22:04:02 - INFO - __main__ - Step 5801: {'lr': 0.0004991871357340269, 'samples': 1113792, 'steps': 5800, 'loss/train': 2.0661230087280273} +11/06/2021 22:04:03 - INFO - __main__ - Step 5802: {'lr': 0.0004991867080865815, 'samples': 1113984, 'steps': 5801, 'loss/train': 2.2368245124816895} +11/06/2021 22:04:03 - INFO - __main__ - Step 5803: {'lr': 0.0004991862803268564, 'samples': 1114176, 'steps': 5802, 'loss/train': 2.107743501663208} +11/06/2021 22:04:03 - INFO - __main__ - Step 5804: {'lr': 0.0004991858524548519, 'samples': 1114368, 'steps': 5803, 'loss/train': 1.269503116607666} +11/06/2021 22:04:05 - INFO - __main__ - Step 5805: {'lr': 0.000499185424470568, 'samples': 1114560, 'steps': 5804, 'loss/train': 1.8158258199691772} +11/06/2021 22:04:05 - INFO - __main__ - Step 5806: {'lr': 0.0004991849963740052, 'samples': 1114752, 'steps': 5805, 'loss/train': 1.9110217094421387} +11/06/2021 22:04:06 - INFO - __main__ - Step 5807: {'lr': 0.0004991845681651632, 'samples': 1114944, 'steps': 5806, 'loss/train': 1.8827478885650635} +11/06/2021 22:04:06 - INFO - __main__ - Step 5808: {'lr': 0.0004991841398440427, 'samples': 1115136, 'steps': 5807, 'loss/train': 1.9933255910873413} +11/06/2021 22:04:06 - INFO - __main__ - Step 5809: {'lr': 0.0004991837114106436, 'samples': 1115328, 'steps': 5808, 'loss/train': 2.1655633449554443} +11/06/2021 22:04:07 - INFO - __main__ - Step 5810: {'lr': 0.0004991832828649661, 'samples': 1115520, 'steps': 5809, 'loss/train': 1.6817560195922852} +11/06/2021 22:04:08 - INFO - __main__ - Step 5811: {'lr': 0.0004991828542070105, 'samples': 1115712, 'steps': 5810, 'loss/train': 0.6421383023262024} +11/06/2021 22:04:08 - INFO - __main__ - Step 5812: {'lr': 0.000499182425436777, 'samples': 1115904, 'steps': 5811, 'loss/train': 1.786048173904419} +11/06/2021 22:04:08 - INFO - __main__ - Step 5813: {'lr': 0.0004991819965542657, 'samples': 1116096, 'steps': 5812, 'loss/train': 1.7168254852294922} +11/06/2021 22:04:09 - INFO - __main__ - Step 5814: {'lr': 0.0004991815675594768, 'samples': 1116288, 'steps': 5813, 'loss/train': 1.5646218061447144} +11/06/2021 22:04:09 - INFO - __main__ - Step 5815: {'lr': 0.0004991811384524106, 'samples': 1116480, 'steps': 5814, 'loss/train': 1.233889102935791} +11/06/2021 22:04:10 - INFO - __main__ - Step 5816: {'lr': 0.0004991807092330671, 'samples': 1116672, 'steps': 5815, 'loss/train': 1.7671700716018677} +11/06/2021 22:04:10 - INFO - __main__ - Step 5817: {'lr': 0.0004991802799014467, 'samples': 1116864, 'steps': 5816, 'loss/train': 2.299095630645752} +11/06/2021 22:04:11 - INFO - __main__ - Step 5818: {'lr': 0.0004991798504575495, 'samples': 1117056, 'steps': 5817, 'loss/train': 1.8498998880386353} +11/06/2021 22:04:11 - INFO - __main__ - Step 5819: {'lr': 0.0004991794209013758, 'samples': 1117248, 'steps': 5818, 'loss/train': 1.8572213649749756} +11/06/2021 22:04:11 - INFO - __main__ - Step 5820: {'lr': 0.0004991789912329257, 'samples': 1117440, 'steps': 5819, 'loss/train': 0.8670408725738525} +11/06/2021 22:04:12 - INFO - __main__ - Step 5821: {'lr': 0.0004991785614521993, 'samples': 1117632, 'steps': 5820, 'loss/train': 3.0006051063537598} +11/06/2021 22:04:13 - INFO - __main__ - Step 5822: {'lr': 0.0004991781315591969, 'samples': 1117824, 'steps': 5821, 'loss/train': 2.1679015159606934} +11/06/2021 22:04:13 - INFO - __main__ - Step 5823: {'lr': 0.0004991777015539186, 'samples': 1118016, 'steps': 5822, 'loss/train': 2.232862710952759} +11/06/2021 22:04:13 - INFO - __main__ - Step 5824: {'lr': 0.0004991772714363649, 'samples': 1118208, 'steps': 5823, 'loss/train': 1.790226936340332} +11/06/2021 22:04:14 - INFO - __main__ - Step 5825: {'lr': 0.0004991768412065355, 'samples': 1118400, 'steps': 5824, 'loss/train': 1.278944492340088} +11/06/2021 22:04:15 - INFO - __main__ - Step 5826: {'lr': 0.000499176410864431, 'samples': 1118592, 'steps': 5825, 'loss/train': 1.5651650428771973} +11/06/2021 22:04:15 - INFO - __main__ - Step 5827: {'lr': 0.0004991759804100515, 'samples': 1118784, 'steps': 5826, 'loss/train': 1.8785316944122314} +11/06/2021 22:04:16 - INFO - __main__ - Step 5828: {'lr': 0.000499175549843397, 'samples': 1118976, 'steps': 5827, 'loss/train': 2.057476282119751} +11/06/2021 22:04:16 - INFO - __main__ - Step 5829: {'lr': 0.0004991751191644679, 'samples': 1119168, 'steps': 5828, 'loss/train': 2.047145366668701} +11/06/2021 22:04:16 - INFO - __main__ - Step 5830: {'lr': 0.0004991746883732644, 'samples': 1119360, 'steps': 5829, 'loss/train': 1.9324302673339844} +11/06/2021 22:04:17 - INFO - __main__ - Step 5831: {'lr': 0.0004991742574697866, 'samples': 1119552, 'steps': 5830, 'loss/train': 1.9625569581985474} +11/06/2021 22:04:18 - INFO - __main__ - Step 5832: {'lr': 0.0004991738264540347, 'samples': 1119744, 'steps': 5831, 'loss/train': 2.0301690101623535} +11/06/2021 22:04:18 - INFO - __main__ - Step 5833: {'lr': 0.0004991733953260089, 'samples': 1119936, 'steps': 5832, 'loss/train': 2.2081518173217773} +11/06/2021 22:04:18 - INFO - __main__ - Step 5834: {'lr': 0.0004991729640857095, 'samples': 1120128, 'steps': 5833, 'loss/train': 1.706737756729126} +11/06/2021 22:04:19 - INFO - __main__ - Step 5835: {'lr': 0.0004991725327331366, 'samples': 1120320, 'steps': 5834, 'loss/train': 1.6535284519195557} +11/06/2021 22:04:19 - INFO - __main__ - Step 5836: {'lr': 0.0004991721012682903, 'samples': 1120512, 'steps': 5835, 'loss/train': 1.5109832286834717} +11/06/2021 22:04:20 - INFO - __main__ - Step 5837: {'lr': 0.0004991716696911709, 'samples': 1120704, 'steps': 5836, 'loss/train': 1.7255332469940186} +11/06/2021 22:04:21 - INFO - __main__ - Step 5838: {'lr': 0.0004991712380017786, 'samples': 1120896, 'steps': 5837, 'loss/train': 2.3126747608184814} +11/06/2021 22:04:21 - INFO - __main__ - Step 5839: {'lr': 0.0004991708062001137, 'samples': 1121088, 'steps': 5838, 'loss/train': 1.5363658666610718} +11/06/2021 22:04:22 - INFO - __main__ - Step 5840: {'lr': 0.0004991703742861762, 'samples': 1121280, 'steps': 5839, 'loss/train': 2.014793872833252} +11/06/2021 22:04:22 - INFO - __main__ - Step 5841: {'lr': 0.0004991699422599664, 'samples': 1121472, 'steps': 5840, 'loss/train': 5.858007907867432} +11/06/2021 22:04:22 - INFO - __main__ - Step 5842: {'lr': 0.0004991695101214844, 'samples': 1121664, 'steps': 5841, 'loss/train': 6.085140228271484} +11/06/2021 22:04:23 - INFO - __main__ - Step 5843: {'lr': 0.0004991690778707305, 'samples': 1121856, 'steps': 5842, 'loss/train': 1.8172892332077026} +11/06/2021 22:04:24 - INFO - __main__ - Step 5844: {'lr': 0.0004991686455077049, 'samples': 1122048, 'steps': 5843, 'loss/train': 2.0172688961029053} +11/06/2021 22:04:24 - INFO - __main__ - Step 5845: {'lr': 0.0004991682130324078, 'samples': 1122240, 'steps': 5844, 'loss/train': 1.5611968040466309} +11/06/2021 22:04:24 - INFO - __main__ - Step 5846: {'lr': 0.0004991677804448392, 'samples': 1122432, 'steps': 5845, 'loss/train': 2.0921804904937744} +11/06/2021 22:04:25 - INFO - __main__ - Step 5847: {'lr': 0.0004991673477449995, 'samples': 1122624, 'steps': 5846, 'loss/train': 1.8288406133651733} +11/06/2021 22:04:25 - INFO - __main__ - Step 5848: {'lr': 0.0004991669149328889, 'samples': 1122816, 'steps': 5847, 'loss/train': 1.8865562677383423} +11/06/2021 22:04:26 - INFO - __main__ - Step 5849: {'lr': 0.0004991664820085074, 'samples': 1123008, 'steps': 5848, 'loss/train': 2.1795449256896973} +11/06/2021 22:04:27 - INFO - __main__ - Step 5850: {'lr': 0.0004991660489718554, 'samples': 1123200, 'steps': 5849, 'loss/train': 1.6964969635009766} +11/06/2021 22:04:27 - INFO - __main__ - Step 5851: {'lr': 0.0004991656158229331, 'samples': 1123392, 'steps': 5850, 'loss/train': 1.9025615453720093} +11/06/2021 22:04:27 - INFO - __main__ - Step 5852: {'lr': 0.0004991651825617406, 'samples': 1123584, 'steps': 5851, 'loss/train': 2.156768560409546} +11/06/2021 22:04:28 - INFO - __main__ - Step 5853: {'lr': 0.000499164749188278, 'samples': 1123776, 'steps': 5852, 'loss/train': 2.2558553218841553} +11/06/2021 22:04:29 - INFO - __main__ - Step 5854: {'lr': 0.0004991643157025458, 'samples': 1123968, 'steps': 5853, 'loss/train': 1.9887200593948364} +11/06/2021 22:04:29 - INFO - __main__ - Step 5855: {'lr': 0.0004991638821045439, 'samples': 1124160, 'steps': 5854, 'loss/train': 2.0848309993743896} +11/06/2021 22:04:29 - INFO - __main__ - Step 5856: {'lr': 0.0004991634483942725, 'samples': 1124352, 'steps': 5855, 'loss/train': 1.9906128644943237} +11/06/2021 22:04:30 - INFO - __main__ - Step 5857: {'lr': 0.000499163014571732, 'samples': 1124544, 'steps': 5856, 'loss/train': 1.9705578088760376} +11/06/2021 22:04:30 - INFO - __main__ - Step 5858: {'lr': 0.0004991625806369225, 'samples': 1124736, 'steps': 5857, 'loss/train': 1.9932202100753784} +11/06/2021 22:04:32 - INFO - __main__ - Step 5859: {'lr': 0.0004991621465898441, 'samples': 1124928, 'steps': 5858, 'loss/train': 1.7375214099884033} +11/06/2021 22:04:32 - INFO - __main__ - Step 5860: {'lr': 0.0004991617124304971, 'samples': 1125120, 'steps': 5859, 'loss/train': 1.9731206893920898} +11/06/2021 22:04:32 - INFO - __main__ - Step 5861: {'lr': 0.0004991612781588818, 'samples': 1125312, 'steps': 5860, 'loss/train': 0.45900076627731323} +11/06/2021 22:04:33 - INFO - __main__ - Step 5862: {'lr': 0.0004991608437749981, 'samples': 1125504, 'steps': 5861, 'loss/train': 2.0371387004852295} +11/06/2021 22:04:33 - INFO - __main__ - Step 5863: {'lr': 0.0004991604092788465, 'samples': 1125696, 'steps': 5862, 'loss/train': 3.404467821121216} +11/06/2021 22:04:33 - INFO - __main__ - Step 5864: {'lr': 0.000499159974670427, 'samples': 1125888, 'steps': 5863, 'loss/train': 1.9706652164459229} +11/06/2021 22:04:34 - INFO - __main__ - Step 5865: {'lr': 0.00049915953994974, 'samples': 1126080, 'steps': 5864, 'loss/train': 1.71634042263031} +11/06/2021 22:04:35 - INFO - __main__ - Step 5866: {'lr': 0.0004991591051167853, 'samples': 1126272, 'steps': 5865, 'loss/train': 2.338533401489258} +11/06/2021 22:04:35 - INFO - __main__ - Step 5867: {'lr': 0.0004991586701715635, 'samples': 1126464, 'steps': 5866, 'loss/train': 0.339321494102478} +11/06/2021 22:04:36 - INFO - __main__ - Step 5868: {'lr': 0.0004991582351140747, 'samples': 1126656, 'steps': 5867, 'loss/train': 1.8088363409042358} +11/06/2021 22:04:36 - INFO - __main__ - Step 5869: {'lr': 0.000499157799944319, 'samples': 1126848, 'steps': 5868, 'loss/train': 1.787323236465454} +11/06/2021 22:04:36 - INFO - __main__ - Step 5870: {'lr': 0.0004991573646622965, 'samples': 1127040, 'steps': 5869, 'loss/train': 1.9397883415222168} +11/06/2021 22:04:37 - INFO - __main__ - Step 5871: {'lr': 0.0004991569292680078, 'samples': 1127232, 'steps': 5870, 'loss/train': 0.43821990489959717} +11/06/2021 22:04:38 - INFO - __main__ - Step 5872: {'lr': 0.0004991564937614526, 'samples': 1127424, 'steps': 5871, 'loss/train': 2.1050267219543457} +11/06/2021 22:04:38 - INFO - __main__ - Step 5873: {'lr': 0.0004991560581426314, 'samples': 1127616, 'steps': 5872, 'loss/train': 2.0710291862487793} +11/06/2021 22:04:38 - INFO - __main__ - Step 5874: {'lr': 0.0004991556224115444, 'samples': 1127808, 'steps': 5873, 'loss/train': 2.220693349838257} +11/06/2021 22:04:39 - INFO - __main__ - Step 5875: {'lr': 0.0004991551865681916, 'samples': 1128000, 'steps': 5874, 'loss/train': 1.8416770696640015} +11/06/2021 22:04:40 - INFO - __main__ - Step 5876: {'lr': 0.0004991547506125734, 'samples': 1128192, 'steps': 5875, 'loss/train': 2.190176248550415} +11/06/2021 22:04:40 - INFO - __main__ - Step 5877: {'lr': 0.0004991543145446899, 'samples': 1128384, 'steps': 5876, 'loss/train': 1.174869418144226} +11/06/2021 22:04:40 - INFO - __main__ - Step 5878: {'lr': 0.0004991538783645413, 'samples': 1128576, 'steps': 5877, 'loss/train': 2.180773973464966} +11/06/2021 22:04:41 - INFO - __main__ - Step 5879: {'lr': 0.0004991534420721278, 'samples': 1128768, 'steps': 5878, 'loss/train': 1.775754451751709} +11/06/2021 22:04:41 - INFO - __main__ - Step 5880: {'lr': 0.0004991530056674496, 'samples': 1128960, 'steps': 5879, 'loss/train': 1.8799948692321777} +11/06/2021 22:04:42 - INFO - __main__ - Step 5881: {'lr': 0.000499152569150507, 'samples': 1129152, 'steps': 5880, 'loss/train': 2.05820894241333} +11/06/2021 22:04:43 - INFO - __main__ - Step 5882: {'lr': 0.0004991521325213, 'samples': 1129344, 'steps': 5881, 'loss/train': 1.8497810363769531} +11/06/2021 22:04:43 - INFO - __main__ - Step 5883: {'lr': 0.0004991516957798289, 'samples': 1129536, 'steps': 5882, 'loss/train': 2.388411521911621} +11/06/2021 22:04:43 - INFO - __main__ - Step 5884: {'lr': 0.0004991512589260939, 'samples': 1129728, 'steps': 5883, 'loss/train': 2.0570759773254395} +11/06/2021 22:04:44 - INFO - __main__ - Step 5885: {'lr': 0.0004991508219600952, 'samples': 1129920, 'steps': 5884, 'loss/train': 2.236051321029663} +11/06/2021 22:04:45 - INFO - __main__ - Step 5886: {'lr': 0.000499150384881833, 'samples': 1130112, 'steps': 5885, 'loss/train': 1.3894482851028442} +11/06/2021 22:04:45 - INFO - __main__ - Step 5887: {'lr': 0.0004991499476913074, 'samples': 1130304, 'steps': 5886, 'loss/train': 1.8141835927963257} +11/06/2021 22:04:45 - INFO - __main__ - Step 5888: {'lr': 0.0004991495103885187, 'samples': 1130496, 'steps': 5887, 'loss/train': 1.7120885848999023} +11/06/2021 22:04:46 - INFO - __main__ - Step 5889: {'lr': 0.0004991490729734672, 'samples': 1130688, 'steps': 5888, 'loss/train': 1.4462894201278687} +11/06/2021 22:04:46 - INFO - __main__ - Step 5890: {'lr': 0.0004991486354461528, 'samples': 1130880, 'steps': 5889, 'loss/train': 2.2380330562591553} +11/06/2021 22:04:46 - INFO - __main__ - Step 5891: {'lr': 0.000499148197806576, 'samples': 1131072, 'steps': 5890, 'loss/train': 1.384273648262024} +11/06/2021 22:04:47 - INFO - __main__ - Step 5892: {'lr': 0.0004991477600547367, 'samples': 1131264, 'steps': 5891, 'loss/train': 1.8132703304290771} +11/06/2021 22:04:48 - INFO - __main__ - Step 5893: {'lr': 0.0004991473221906354, 'samples': 1131456, 'steps': 5892, 'loss/train': 2.0042428970336914} +11/06/2021 22:04:48 - INFO - __main__ - Step 5894: {'lr': 0.0004991468842142722, 'samples': 1131648, 'steps': 5893, 'loss/train': 2.088541030883789} +11/06/2021 22:04:48 - INFO - __main__ - Step 5895: {'lr': 0.0004991464461256472, 'samples': 1131840, 'steps': 5894, 'loss/train': 1.8709157705307007} +11/06/2021 22:04:49 - INFO - __main__ - Step 5896: {'lr': 0.0004991460079247606, 'samples': 1132032, 'steps': 5895, 'loss/train': 1.9683117866516113} +11/06/2021 22:04:50 - INFO - __main__ - Step 5897: {'lr': 0.0004991455696116128, 'samples': 1132224, 'steps': 5896, 'loss/train': 1.7423728704452515} +11/06/2021 22:04:50 - INFO - __main__ - Step 5898: {'lr': 0.0004991451311862037, 'samples': 1132416, 'steps': 5897, 'loss/train': 1.5214271545410156} +11/06/2021 22:04:50 - INFO - __main__ - Step 5899: {'lr': 0.0004991446926485337, 'samples': 1132608, 'steps': 5898, 'loss/train': 1.8397377729415894} +11/06/2021 22:04:51 - INFO - __main__ - Step 5900: {'lr': 0.0004991442539986029, 'samples': 1132800, 'steps': 5899, 'loss/train': 2.119931697845459} +11/06/2021 22:04:51 - INFO - __main__ - Step 5901: {'lr': 0.0004991438152364117, 'samples': 1132992, 'steps': 5900, 'loss/train': 1.960817813873291} +11/06/2021 22:04:52 - INFO - __main__ - Step 5902: {'lr': 0.0004991433763619599, 'samples': 1133184, 'steps': 5901, 'loss/train': 1.7662793397903442} +11/06/2021 22:04:52 - INFO - __main__ - Step 5903: {'lr': 0.0004991429373752482, 'samples': 1133376, 'steps': 5902, 'loss/train': 1.5504059791564941} +11/06/2021 22:04:53 - INFO - __main__ - Step 5904: {'lr': 0.0004991424982762763, 'samples': 1133568, 'steps': 5903, 'loss/train': 2.349090576171875} +11/06/2021 22:04:53 - INFO - __main__ - Step 5905: {'lr': 0.0004991420590650448, 'samples': 1133760, 'steps': 5904, 'loss/train': 1.9303275346755981} +11/06/2021 22:04:54 - INFO - __main__ - Step 5906: {'lr': 0.0004991416197415537, 'samples': 1133952, 'steps': 5905, 'loss/train': 1.6415051221847534} +11/06/2021 22:04:55 - INFO - __main__ - Step 5907: {'lr': 0.0004991411803058032, 'samples': 1134144, 'steps': 5906, 'loss/train': 1.6599597930908203} +11/06/2021 22:04:55 - INFO - __main__ - Step 5908: {'lr': 0.0004991407407577936, 'samples': 1134336, 'steps': 5907, 'loss/train': 1.926432728767395} +11/06/2021 22:04:55 - INFO - __main__ - Step 5909: {'lr': 0.0004991403010975249, 'samples': 1134528, 'steps': 5908, 'loss/train': 1.6873294115066528} +11/06/2021 22:04:56 - INFO - __main__ - Step 5910: {'lr': 0.0004991398613249976, 'samples': 1134720, 'steps': 5909, 'loss/train': 2.0104522705078125} +11/06/2021 22:04:56 - INFO - __main__ - Step 5911: {'lr': 0.0004991394214402115, 'samples': 1134912, 'steps': 5910, 'loss/train': 1.2183507680892944} +11/06/2021 22:04:57 - INFO - __main__ - Step 5912: {'lr': 0.0004991389814431672, 'samples': 1135104, 'steps': 5911, 'loss/train': 2.336418390274048} +11/06/2021 22:04:57 - INFO - __main__ - Step 5913: {'lr': 0.0004991385413338646, 'samples': 1135296, 'steps': 5912, 'loss/train': 1.6936346292495728} +11/06/2021 22:04:58 - INFO - __main__ - Step 5914: {'lr': 0.0004991381011123041, 'samples': 1135488, 'steps': 5913, 'loss/train': 1.936176061630249} +11/06/2021 22:04:58 - INFO - __main__ - Step 5915: {'lr': 0.0004991376607784857, 'samples': 1135680, 'steps': 5914, 'loss/train': 2.222874402999878} +11/06/2021 22:04:58 - INFO - __main__ - Step 5916: {'lr': 0.0004991372203324098, 'samples': 1135872, 'steps': 5915, 'loss/train': 1.72451913356781} +11/06/2021 22:04:59 - INFO - __main__ - Step 5917: {'lr': 0.0004991367797740765, 'samples': 1136064, 'steps': 5916, 'loss/train': 2.277719736099243} +11/06/2021 22:05:00 - INFO - __main__ - Step 5918: {'lr': 0.0004991363391034861, 'samples': 1136256, 'steps': 5917, 'loss/train': 1.82767915725708} +11/06/2021 22:05:00 - INFO - __main__ - Step 5919: {'lr': 0.0004991358983206386, 'samples': 1136448, 'steps': 5918, 'loss/train': 1.7569984197616577} +11/06/2021 22:05:00 - INFO - __main__ - Step 5920: {'lr': 0.0004991354574255344, 'samples': 1136640, 'steps': 5919, 'loss/train': 1.7401177883148193} +11/06/2021 22:05:01 - INFO - __main__ - Step 5921: {'lr': 0.0004991350164181735, 'samples': 1136832, 'steps': 5920, 'loss/train': 1.826175332069397} +11/06/2021 22:05:02 - INFO - __main__ - Step 5922: {'lr': 0.0004991345752985563, 'samples': 1137024, 'steps': 5921, 'loss/train': 1.4562937021255493} +11/06/2021 22:05:02 - INFO - __main__ - Step 5923: {'lr': 0.0004991341340666828, 'samples': 1137216, 'steps': 5922, 'loss/train': 2.3827600479125977} +11/06/2021 22:05:03 - INFO - __main__ - Step 5924: {'lr': 0.0004991336927225534, 'samples': 1137408, 'steps': 5923, 'loss/train': 1.9076972007751465} +11/06/2021 22:05:03 - INFO - __main__ - Step 5925: {'lr': 0.0004991332512661682, 'samples': 1137600, 'steps': 5924, 'loss/train': 1.9979768991470337} +11/06/2021 22:05:03 - INFO - __main__ - Step 5926: {'lr': 0.0004991328096975273, 'samples': 1137792, 'steps': 5925, 'loss/train': 2.118201971054077} +11/06/2021 22:05:04 - INFO - __main__ - Step 5927: {'lr': 0.0004991323680166312, 'samples': 1137984, 'steps': 5926, 'loss/train': 2.161531925201416} +11/06/2021 22:05:05 - INFO - __main__ - Step 5928: {'lr': 0.0004991319262234797, 'samples': 1138176, 'steps': 5927, 'loss/train': 1.8950947523117065} +11/06/2021 22:05:05 - INFO - __main__ - Step 5929: {'lr': 0.0004991314843180733, 'samples': 1138368, 'steps': 5928, 'loss/train': 1.211108684539795} +11/06/2021 22:05:05 - INFO - __main__ - Step 5930: {'lr': 0.0004991310423004121, 'samples': 1138560, 'steps': 5929, 'loss/train': 2.195322275161743} +11/06/2021 22:05:06 - INFO - __main__ - Step 5931: {'lr': 0.0004991306001704962, 'samples': 1138752, 'steps': 5930, 'loss/train': 2.2083332538604736} +11/06/2021 22:05:06 - INFO - __main__ - Step 5932: {'lr': 0.000499130157928326, 'samples': 1138944, 'steps': 5931, 'loss/train': 1.8265712261199951} +11/06/2021 22:05:07 - INFO - __main__ - Step 5933: {'lr': 0.0004991297155739015, 'samples': 1139136, 'steps': 5932, 'loss/train': 2.3104774951934814} +11/06/2021 22:05:08 - INFO - __main__ - Step 5934: {'lr': 0.0004991292731072231, 'samples': 1139328, 'steps': 5933, 'loss/train': 1.6424787044525146} +11/06/2021 22:05:08 - INFO - __main__ - Step 5935: {'lr': 0.0004991288305282908, 'samples': 1139520, 'steps': 5934, 'loss/train': 1.7371667623519897} +11/06/2021 22:05:08 - INFO - __main__ - Step 5936: {'lr': 0.0004991283878371049, 'samples': 1139712, 'steps': 5935, 'loss/train': 2.0819458961486816} +11/06/2021 22:05:09 - INFO - __main__ - Step 5937: {'lr': 0.0004991279450336656, 'samples': 1139904, 'steps': 5936, 'loss/train': 2.049226999282837} +11/06/2021 22:05:09 - INFO - __main__ - Step 5938: {'lr': 0.0004991275021179732, 'samples': 1140096, 'steps': 5937, 'loss/train': 1.6424188613891602} +11/06/2021 22:05:10 - INFO - __main__ - Step 5939: {'lr': 0.0004991270590900277, 'samples': 1140288, 'steps': 5938, 'loss/train': 2.0688111782073975} +11/06/2021 22:05:11 - INFO - __main__ - Step 5940: {'lr': 0.0004991266159498294, 'samples': 1140480, 'steps': 5939, 'loss/train': 1.3544045686721802} +11/06/2021 22:05:11 - INFO - __main__ - Step 5941: {'lr': 0.0004991261726973784, 'samples': 1140672, 'steps': 5940, 'loss/train': 2.6650118827819824} +11/06/2021 22:05:11 - INFO - __main__ - Step 5942: {'lr': 0.0004991257293326752, 'samples': 1140864, 'steps': 5941, 'loss/train': 1.340391993522644} +11/06/2021 22:05:12 - INFO - __main__ - Step 5943: {'lr': 0.0004991252858557196, 'samples': 1141056, 'steps': 5942, 'loss/train': 1.737450122833252} +11/06/2021 22:05:12 - INFO - __main__ - Step 5944: {'lr': 0.0004991248422665122, 'samples': 1141248, 'steps': 5943, 'loss/train': 2.2285938262939453} +11/06/2021 22:05:13 - INFO - __main__ - Step 5945: {'lr': 0.0004991243985650528, 'samples': 1141440, 'steps': 5944, 'loss/train': 2.2643086910247803} +11/06/2021 22:05:13 - INFO - __main__ - Step 5946: {'lr': 0.0004991239547513419, 'samples': 1141632, 'steps': 5945, 'loss/train': 1.9071139097213745} +11/06/2021 22:05:14 - INFO - __main__ - Step 5947: {'lr': 0.0004991235108253795, 'samples': 1141824, 'steps': 5946, 'loss/train': 1.679957628250122} +11/06/2021 22:05:14 - INFO - __main__ - Step 5948: {'lr': 0.0004991230667871659, 'samples': 1142016, 'steps': 5947, 'loss/train': 0.8383622765541077} +11/06/2021 22:05:16 - INFO - __main__ - Step 5949: {'lr': 0.0004991226226367013, 'samples': 1142208, 'steps': 5948, 'loss/train': 1.7677212953567505} +11/06/2021 22:05:16 - INFO - __main__ - Step 5950: {'lr': 0.0004991221783739859, 'samples': 1142400, 'steps': 5949, 'loss/train': 2.1849448680877686} +11/06/2021 22:05:16 - INFO - __main__ - Step 5951: {'lr': 0.0004991217339990199, 'samples': 1142592, 'steps': 5950, 'loss/train': 1.8535935878753662} +11/06/2021 22:05:17 - INFO - __main__ - Step 5952: {'lr': 0.0004991212895118035, 'samples': 1142784, 'steps': 5951, 'loss/train': 2.292984962463379} +11/06/2021 22:05:17 - INFO - __main__ - Step 5953: {'lr': 0.0004991208449123369, 'samples': 1142976, 'steps': 5952, 'loss/train': 2.318779468536377} +11/06/2021 22:05:17 - INFO - __main__ - Step 5954: {'lr': 0.0004991204002006203, 'samples': 1143168, 'steps': 5953, 'loss/train': 2.651663064956665} +11/06/2021 22:05:18 - INFO - __main__ - Step 5955: {'lr': 0.0004991199553766538, 'samples': 1143360, 'steps': 5954, 'loss/train': 2.468550205230713} +11/06/2021 22:05:19 - INFO - __main__ - Step 5956: {'lr': 0.0004991195104404378, 'samples': 1143552, 'steps': 5955, 'loss/train': 1.74437415599823} +11/06/2021 22:05:19 - INFO - __main__ - Step 5957: {'lr': 0.0004991190653919723, 'samples': 1143744, 'steps': 5956, 'loss/train': 1.5060465335845947} +11/06/2021 22:05:19 - INFO - __main__ - Step 5958: {'lr': 0.0004991186202312576, 'samples': 1143936, 'steps': 5957, 'loss/train': 2.46972393989563} +11/06/2021 22:05:20 - INFO - __main__ - Step 5959: {'lr': 0.0004991181749582941, 'samples': 1144128, 'steps': 5958, 'loss/train': 1.874528408050537} +11/06/2021 22:05:20 - INFO - __main__ - Step 5960: {'lr': 0.0004991177295730815, 'samples': 1144320, 'steps': 5959, 'loss/train': 1.015513300895691} +11/06/2021 22:05:21 - INFO - __main__ - Step 5961: {'lr': 0.0004991172840756204, 'samples': 1144512, 'steps': 5960, 'loss/train': 1.6141202449798584} +11/06/2021 22:05:22 - INFO - __main__ - Step 5962: {'lr': 0.000499116838465911, 'samples': 1144704, 'steps': 5961, 'loss/train': 2.2520675659179688} +11/06/2021 22:05:22 - INFO - __main__ - Step 5963: {'lr': 0.0004991163927439533, 'samples': 1144896, 'steps': 5962, 'loss/train': 2.061602830886841} +11/06/2021 22:05:22 - INFO - __main__ - Step 5964: {'lr': 0.0004991159469097476, 'samples': 1145088, 'steps': 5963, 'loss/train': 1.7788499593734741} +11/06/2021 22:05:23 - INFO - __main__ - Step 5965: {'lr': 0.0004991155009632941, 'samples': 1145280, 'steps': 5964, 'loss/train': 2.016207456588745} +11/06/2021 22:05:23 - INFO - __main__ - Step 5966: {'lr': 0.0004991150549045931, 'samples': 1145472, 'steps': 5965, 'loss/train': 2.390394926071167} +11/06/2021 22:05:24 - INFO - __main__ - Step 5967: {'lr': 0.0004991146087336446, 'samples': 1145664, 'steps': 5966, 'loss/train': 2.1438944339752197} +11/06/2021 22:05:24 - INFO - __main__ - Step 5968: {'lr': 0.0004991141624504489, 'samples': 1145856, 'steps': 5967, 'loss/train': 2.0830070972442627} +11/06/2021 22:05:25 - INFO - __main__ - Step 5969: {'lr': 0.0004991137160550062, 'samples': 1146048, 'steps': 5968, 'loss/train': 1.9556607007980347} +11/06/2021 22:05:25 - INFO - __main__ - Step 5970: {'lr': 0.0004991132695473167, 'samples': 1146240, 'steps': 5969, 'loss/train': 1.7997961044311523} +11/06/2021 22:05:25 - INFO - __main__ - Step 5971: {'lr': 0.0004991128229273807, 'samples': 1146432, 'steps': 5970, 'loss/train': 2.2100391387939453} +11/06/2021 22:05:26 - INFO - __main__ - Step 5972: {'lr': 0.0004991123761951982, 'samples': 1146624, 'steps': 5971, 'loss/train': 2.2720751762390137} +11/06/2021 22:05:27 - INFO - __main__ - Step 5973: {'lr': 0.0004991119293507695, 'samples': 1146816, 'steps': 5972, 'loss/train': 2.5560436248779297} +11/06/2021 22:05:27 - INFO - __main__ - Step 5974: {'lr': 0.0004991114823940948, 'samples': 1147008, 'steps': 5973, 'loss/train': 1.9444048404693604} +11/06/2021 22:05:27 - INFO - __main__ - Step 5975: {'lr': 0.0004991110353251744, 'samples': 1147200, 'steps': 5974, 'loss/train': 1.894894003868103} +11/06/2021 22:05:28 - INFO - __main__ - Step 5976: {'lr': 0.0004991105881440084, 'samples': 1147392, 'steps': 5975, 'loss/train': 1.42281174659729} +11/06/2021 22:05:29 - INFO - __main__ - Step 5977: {'lr': 0.000499110140850597, 'samples': 1147584, 'steps': 5976, 'loss/train': 1.4847767353057861} +11/06/2021 22:05:29 - INFO - __main__ - Step 5978: {'lr': 0.0004991096934449404, 'samples': 1147776, 'steps': 5977, 'loss/train': 1.5438770055770874} +11/06/2021 22:05:30 - INFO - __main__ - Step 5979: {'lr': 0.0004991092459270388, 'samples': 1147968, 'steps': 5978, 'loss/train': 1.8954336643218994} +11/06/2021 22:05:30 - INFO - __main__ - Step 5980: {'lr': 0.0004991087982968924, 'samples': 1148160, 'steps': 5979, 'loss/train': 1.413256287574768} +11/06/2021 22:05:30 - INFO - __main__ - Step 5981: {'lr': 0.0004991083505545014, 'samples': 1148352, 'steps': 5980, 'loss/train': 2.335400104522705} +11/06/2021 22:05:31 - INFO - __main__ - Step 5982: {'lr': 0.0004991079026998662, 'samples': 1148544, 'steps': 5981, 'loss/train': 1.8564774990081787} +11/06/2021 22:05:32 - INFO - __main__ - Step 5983: {'lr': 0.0004991074547329867, 'samples': 1148736, 'steps': 5982, 'loss/train': 2.0363080501556396} +11/06/2021 22:05:32 - INFO - __main__ - Step 5984: {'lr': 0.0004991070066538632, 'samples': 1148928, 'steps': 5983, 'loss/train': 1.7715718746185303} +11/06/2021 22:05:32 - INFO - __main__ - Step 5985: {'lr': 0.0004991065584624959, 'samples': 1149120, 'steps': 5984, 'loss/train': 2.119075059890747} +11/06/2021 22:05:33 - INFO - __main__ - Step 5986: {'lr': 0.0004991061101588851, 'samples': 1149312, 'steps': 5985, 'loss/train': 1.6880245208740234} +11/06/2021 22:05:33 - INFO - __main__ - Step 5987: {'lr': 0.0004991056617430308, 'samples': 1149504, 'steps': 5986, 'loss/train': 1.5863991975784302} +11/06/2021 22:05:34 - INFO - __main__ - Step 5988: {'lr': 0.0004991052132149336, 'samples': 1149696, 'steps': 5987, 'loss/train': 1.918567419052124} +11/06/2021 22:05:35 - INFO - __main__ - Step 5989: {'lr': 0.0004991047645745932, 'samples': 1149888, 'steps': 5988, 'loss/train': 2.1846141815185547} +11/06/2021 22:05:35 - INFO - __main__ - Step 5990: {'lr': 0.0004991043158220101, 'samples': 1150080, 'steps': 5989, 'loss/train': 0.287127822637558} +11/06/2021 22:05:35 - INFO - __main__ - Step 5991: {'lr': 0.0004991038669571844, 'samples': 1150272, 'steps': 5990, 'loss/train': 2.2613940238952637} +11/06/2021 22:05:36 - INFO - __main__ - Step 5992: {'lr': 0.0004991034179801165, 'samples': 1150464, 'steps': 5991, 'loss/train': 2.2237813472747803} +11/06/2021 22:05:37 - INFO - __main__ - Step 5993: {'lr': 0.0004991029688908063, 'samples': 1150656, 'steps': 5992, 'loss/train': 1.6125682592391968} +11/06/2021 22:05:37 - INFO - __main__ - Step 5994: {'lr': 0.0004991025196892542, 'samples': 1150848, 'steps': 5993, 'loss/train': 2.0412638187408447} +11/06/2021 22:05:37 - INFO - __main__ - Step 5995: {'lr': 0.0004991020703754603, 'samples': 1151040, 'steps': 5994, 'loss/train': 2.479659080505371} +11/06/2021 22:05:38 - INFO - __main__ - Step 5996: {'lr': 0.0004991016209494249, 'samples': 1151232, 'steps': 5995, 'loss/train': 1.6935555934906006} +11/06/2021 22:05:38 - INFO - __main__ - Step 5997: {'lr': 0.000499101171411148, 'samples': 1151424, 'steps': 5996, 'loss/train': 1.8328980207443237} +11/06/2021 22:05:39 - INFO - __main__ - Step 5998: {'lr': 0.0004991007217606303, 'samples': 1151616, 'steps': 5997, 'loss/train': 1.736120343208313} +11/06/2021 22:05:39 - INFO - __main__ - Step 5999: {'lr': 0.0004991002719978713, 'samples': 1151808, 'steps': 5998, 'loss/train': 1.7928426265716553} +11/06/2021 22:05:40 - INFO - __main__ - Step 6000: {'lr': 0.0004990998221228718, 'samples': 1152000, 'steps': 5999, 'loss/train': 2.1965417861938477} +11/06/2021 22:05:40 - INFO - __main__ - Step 6001: {'lr': 0.0004990993721356316, 'samples': 1152192, 'steps': 6000, 'loss/train': 1.9689626693725586} +11/06/2021 22:05:41 - INFO - __main__ - Step 6002: {'lr': 0.0004990989220361511, 'samples': 1152384, 'steps': 6001, 'loss/train': 2.398984670639038} +11/06/2021 22:05:42 - INFO - __main__ - Step 6003: {'lr': 0.0004990984718244306, 'samples': 1152576, 'steps': 6002, 'loss/train': 1.8467917442321777} +11/06/2021 22:05:42 - INFO - __main__ - Step 6004: {'lr': 0.00049909802150047, 'samples': 1152768, 'steps': 6003, 'loss/train': 1.9117133617401123} +11/06/2021 22:05:42 - INFO - __main__ - Step 6005: {'lr': 0.0004990975710642699, 'samples': 1152960, 'steps': 6004, 'loss/train': 2.0805423259735107} +11/06/2021 22:05:43 - INFO - __main__ - Step 6006: {'lr': 0.0004990971205158301, 'samples': 1153152, 'steps': 6005, 'loss/train': 1.9245171546936035} +11/06/2021 22:05:43 - INFO - __main__ - Step 6007: {'lr': 0.000499096669855151, 'samples': 1153344, 'steps': 6006, 'loss/train': 1.9373234510421753} +11/06/2021 22:05:44 - INFO - __main__ - Step 6008: {'lr': 0.0004990962190822328, 'samples': 1153536, 'steps': 6007, 'loss/train': 2.0879454612731934} +11/06/2021 22:05:44 - INFO - __main__ - Step 6009: {'lr': 0.0004990957681970757, 'samples': 1153728, 'steps': 6008, 'loss/train': 1.5155565738677979} +11/06/2021 22:05:45 - INFO - __main__ - Step 6010: {'lr': 0.0004990953171996798, 'samples': 1153920, 'steps': 6009, 'loss/train': 1.890929937362671} +11/06/2021 22:05:45 - INFO - __main__ - Step 6011: {'lr': 0.0004990948660900455, 'samples': 1154112, 'steps': 6010, 'loss/train': 1.6468206644058228} +11/06/2021 22:05:45 - INFO - __main__ - Step 6012: {'lr': 0.0004990944148681729, 'samples': 1154304, 'steps': 6011, 'loss/train': 1.8808773756027222} +11/06/2021 22:05:46 - INFO - __main__ - Step 6013: {'lr': 0.0004990939635340621, 'samples': 1154496, 'steps': 6012, 'loss/train': 1.6922487020492554} +11/06/2021 22:05:47 - INFO - __main__ - Step 6014: {'lr': 0.0004990935120877136, 'samples': 1154688, 'steps': 6013, 'loss/train': 1.5045371055603027} +11/06/2021 22:05:47 - INFO - __main__ - Step 6015: {'lr': 0.0004990930605291272, 'samples': 1154880, 'steps': 6014, 'loss/train': 1.9965391159057617} +11/06/2021 22:05:47 - INFO - __main__ - Step 6016: {'lr': 0.0004990926088583034, 'samples': 1155072, 'steps': 6015, 'loss/train': 1.9830745458602905} +11/06/2021 22:05:48 - INFO - __main__ - Step 6017: {'lr': 0.0004990921570752424, 'samples': 1155264, 'steps': 6016, 'loss/train': 1.850488305091858} +11/06/2021 22:05:49 - INFO - __main__ - Step 6018: {'lr': 0.0004990917051799442, 'samples': 1155456, 'steps': 6017, 'loss/train': 2.0463662147521973} +11/06/2021 22:05:49 - INFO - __main__ - Step 6019: {'lr': 0.0004990912531724092, 'samples': 1155648, 'steps': 6018, 'loss/train': 1.561757206916809} +11/06/2021 22:05:50 - INFO - __main__ - Step 6020: {'lr': 0.0004990908010526374, 'samples': 1155840, 'steps': 6019, 'loss/train': 2.3812918663024902} +11/06/2021 22:05:50 - INFO - __main__ - Step 6021: {'lr': 0.0004990903488206292, 'samples': 1156032, 'steps': 6020, 'loss/train': 1.9738842248916626} +11/06/2021 22:05:50 - INFO - __main__ - Step 6022: {'lr': 0.0004990898964763847, 'samples': 1156224, 'steps': 6021, 'loss/train': 1.0704938173294067} +11/06/2021 22:05:51 - INFO - __main__ - Step 6023: {'lr': 0.0004990894440199042, 'samples': 1156416, 'steps': 6022, 'loss/train': 2.2078778743743896} +11/06/2021 22:05:52 - INFO - __main__ - Step 6024: {'lr': 0.0004990889914511878, 'samples': 1156608, 'steps': 6023, 'loss/train': 1.3262114524841309} +11/06/2021 22:05:52 - INFO - __main__ - Step 6025: {'lr': 0.0004990885387702357, 'samples': 1156800, 'steps': 6024, 'loss/train': 2.6244781017303467} +11/06/2021 22:05:52 - INFO - __main__ - Step 6026: {'lr': 0.0004990880859770483, 'samples': 1156992, 'steps': 6025, 'loss/train': 2.0771734714508057} +11/06/2021 22:05:53 - INFO - __main__ - Step 6027: {'lr': 0.0004990876330716256, 'samples': 1157184, 'steps': 6026, 'loss/train': 1.7819007635116577} +11/06/2021 22:05:53 - INFO - __main__ - Step 6028: {'lr': 0.0004990871800539677, 'samples': 1157376, 'steps': 6027, 'loss/train': 2.1311354637145996} +11/06/2021 22:05:54 - INFO - __main__ - Step 6029: {'lr': 0.0004990867269240751, 'samples': 1157568, 'steps': 6028, 'loss/train': 2.2152881622314453} +11/06/2021 22:05:55 - INFO - __main__ - Step 6030: {'lr': 0.0004990862736819478, 'samples': 1157760, 'steps': 6029, 'loss/train': 2.027174949645996} +11/06/2021 22:05:55 - INFO - __main__ - Step 6031: {'lr': 0.000499085820327586, 'samples': 1157952, 'steps': 6030, 'loss/train': 1.750157356262207} +11/06/2021 22:05:55 - INFO - __main__ - Step 6032: {'lr': 0.0004990853668609902, 'samples': 1158144, 'steps': 6031, 'loss/train': 1.8239428997039795} +11/06/2021 22:05:56 - INFO - __main__ - Step 6033: {'lr': 0.0004990849132821602, 'samples': 1158336, 'steps': 6032, 'loss/train': 1.92527437210083} +11/06/2021 22:05:57 - INFO - __main__ - Step 6034: {'lr': 0.0004990844595910965, 'samples': 1158528, 'steps': 6033, 'loss/train': 2.1087069511413574} +11/06/2021 22:05:57 - INFO - __main__ - Step 6035: {'lr': 0.0004990840057877991, 'samples': 1158720, 'steps': 6034, 'loss/train': 1.7086195945739746} +11/06/2021 22:05:57 - INFO - __main__ - Step 6036: {'lr': 0.0004990835518722683, 'samples': 1158912, 'steps': 6035, 'loss/train': 1.736742615699768} +11/06/2021 22:05:58 - INFO - __main__ - Step 6037: {'lr': 0.0004990830978445043, 'samples': 1159104, 'steps': 6036, 'loss/train': 2.061073064804077} +11/06/2021 22:05:58 - INFO - __main__ - Step 6038: {'lr': 0.0004990826437045073, 'samples': 1159296, 'steps': 6037, 'loss/train': 1.51176917552948} +11/06/2021 22:05:59 - INFO - __main__ - Step 6039: {'lr': 0.0004990821894522775, 'samples': 1159488, 'steps': 6038, 'loss/train': 2.080949306488037} +11/06/2021 22:05:59 - INFO - __main__ - Step 6040: {'lr': 0.0004990817350878152, 'samples': 1159680, 'steps': 6039, 'loss/train': 1.2319962978363037} +11/06/2021 22:06:00 - INFO - __main__ - Step 6041: {'lr': 0.0004990812806111205, 'samples': 1159872, 'steps': 6040, 'loss/train': 2.2004785537719727} +11/06/2021 22:06:00 - INFO - __main__ - Step 6042: {'lr': 0.0004990808260221934, 'samples': 1160064, 'steps': 6041, 'loss/train': 2.198143243789673} +11/06/2021 22:06:00 - INFO - __main__ - Step 6043: {'lr': 0.0004990803713210345, 'samples': 1160256, 'steps': 6042, 'loss/train': 2.189502716064453} +11/06/2021 22:06:01 - INFO - __main__ - Step 6044: {'lr': 0.0004990799165076438, 'samples': 1160448, 'steps': 6043, 'loss/train': 0.32099586725234985} +11/06/2021 22:06:02 - INFO - __main__ - Step 6045: {'lr': 0.0004990794615820216, 'samples': 1160640, 'steps': 6044, 'loss/train': 2.055501937866211} +11/06/2021 22:06:02 - INFO - __main__ - Step 6046: {'lr': 0.0004990790065441679, 'samples': 1160832, 'steps': 6045, 'loss/train': 2.4283854961395264} +11/06/2021 22:06:03 - INFO - __main__ - Step 6047: {'lr': 0.0004990785513940832, 'samples': 1161024, 'steps': 6046, 'loss/train': 1.5293772220611572} +11/06/2021 22:06:03 - INFO - __main__ - Step 6048: {'lr': 0.0004990780961317674, 'samples': 1161216, 'steps': 6047, 'loss/train': 1.82656729221344} +11/06/2021 22:06:04 - INFO - __main__ - Step 6049: {'lr': 0.0004990776407572209, 'samples': 1161408, 'steps': 6048, 'loss/train': 2.004995107650757} +11/06/2021 22:06:04 - INFO - __main__ - Step 6050: {'lr': 0.000499077185270444, 'samples': 1161600, 'steps': 6049, 'loss/train': 1.4372830390930176} +11/06/2021 22:06:05 - INFO - __main__ - Step 6051: {'lr': 0.0004990767296714365, 'samples': 1161792, 'steps': 6050, 'loss/train': 1.7014871835708618} +11/06/2021 22:06:05 - INFO - __main__ - Step 6052: {'lr': 0.000499076273960199, 'samples': 1161984, 'steps': 6051, 'loss/train': 2.0586600303649902} +11/06/2021 22:06:05 - INFO - __main__ - Step 6053: {'lr': 0.0004990758181367316, 'samples': 1162176, 'steps': 6052, 'loss/train': 1.914888858795166} +11/06/2021 22:06:06 - INFO - __main__ - Step 6054: {'lr': 0.0004990753622010345, 'samples': 1162368, 'steps': 6053, 'loss/train': 2.2003793716430664} +11/06/2021 22:06:06 - INFO - __main__ - Step 6055: {'lr': 0.0004990749061531079, 'samples': 1162560, 'steps': 6054, 'loss/train': 2.1446890830993652} +11/06/2021 22:06:07 - INFO - __main__ - Step 6056: {'lr': 0.0004990744499929519, 'samples': 1162752, 'steps': 6055, 'loss/train': 1.890893578529358} +11/06/2021 22:06:07 - INFO - __main__ - Step 6057: {'lr': 0.0004990739937205668, 'samples': 1162944, 'steps': 6056, 'loss/train': 1.2735779285430908} +11/06/2021 22:06:08 - INFO - __main__ - Step 6058: {'lr': 0.0004990735373359529, 'samples': 1163136, 'steps': 6057, 'loss/train': 1.9701690673828125} +11/06/2021 22:06:08 - INFO - __main__ - Step 6059: {'lr': 0.0004990730808391102, 'samples': 1163328, 'steps': 6058, 'loss/train': 2.143030881881714} +11/06/2021 22:06:09 - INFO - __main__ - Step 6060: {'lr': 0.0004990726242300391, 'samples': 1163520, 'steps': 6059, 'loss/train': 2.049363613128662} +11/06/2021 22:06:09 - INFO - __main__ - Step 6061: {'lr': 0.0004990721675087397, 'samples': 1163712, 'steps': 6060, 'loss/train': 2.1596553325653076} +11/06/2021 22:06:10 - INFO - __main__ - Step 6062: {'lr': 0.0004990717106752122, 'samples': 1163904, 'steps': 6061, 'loss/train': 2.0180513858795166} +11/06/2021 22:06:10 - INFO - __main__ - Step 6063: {'lr': 0.0004990712537294568, 'samples': 1164096, 'steps': 6062, 'loss/train': 2.0434930324554443} +11/06/2021 22:06:10 - INFO - __main__ - Step 6064: {'lr': 0.0004990707966714738, 'samples': 1164288, 'steps': 6063, 'loss/train': 1.9746204614639282} +11/06/2021 22:06:11 - INFO - __main__ - Step 6065: {'lr': 0.0004990703395012634, 'samples': 1164480, 'steps': 6064, 'loss/train': 2.094088554382324} +11/06/2021 22:06:12 - INFO - __main__ - Step 6066: {'lr': 0.0004990698822188255, 'samples': 1164672, 'steps': 6065, 'loss/train': 1.3795504570007324} +11/06/2021 22:06:12 - INFO - __main__ - Step 6067: {'lr': 0.0004990694248241608, 'samples': 1164864, 'steps': 6066, 'loss/train': 2.1936051845550537} +11/06/2021 22:06:12 - INFO - __main__ - Step 6068: {'lr': 0.0004990689673172691, 'samples': 1165056, 'steps': 6067, 'loss/train': 2.1371805667877197} +11/06/2021 22:06:13 - INFO - __main__ - Step 6069: {'lr': 0.000499068509698151, 'samples': 1165248, 'steps': 6068, 'loss/train': 1.7530931234359741} +11/06/2021 22:06:14 - INFO - __main__ - Step 6070: {'lr': 0.0004990680519668063, 'samples': 1165440, 'steps': 6069, 'loss/train': 2.192474842071533} +11/06/2021 22:06:14 - INFO - __main__ - Step 6071: {'lr': 0.0004990675941232354, 'samples': 1165632, 'steps': 6070, 'loss/train': 1.666622281074524} +11/06/2021 22:06:15 - INFO - __main__ - Step 6072: {'lr': 0.0004990671361674384, 'samples': 1165824, 'steps': 6071, 'loss/train': 1.9727286100387573} +11/06/2021 22:06:15 - INFO - __main__ - Step 6073: {'lr': 0.0004990666780994156, 'samples': 1166016, 'steps': 6072, 'loss/train': 2.116274356842041} +11/06/2021 22:06:15 - INFO - __main__ - Step 6074: {'lr': 0.0004990662199191673, 'samples': 1166208, 'steps': 6073, 'loss/train': 2.271106243133545} +11/06/2021 22:06:16 - INFO - __main__ - Step 6075: {'lr': 0.0004990657616266936, 'samples': 1166400, 'steps': 6074, 'loss/train': 1.8674793243408203} +11/06/2021 22:06:17 - INFO - __main__ - Step 6076: {'lr': 0.0004990653032219947, 'samples': 1166592, 'steps': 6075, 'loss/train': 1.4734982252120972} +11/06/2021 22:06:17 - INFO - __main__ - Step 6077: {'lr': 0.0004990648447050709, 'samples': 1166784, 'steps': 6076, 'loss/train': 1.8218048810958862} +11/06/2021 22:06:17 - INFO - __main__ - Step 6078: {'lr': 0.0004990643860759222, 'samples': 1166976, 'steps': 6077, 'loss/train': 1.642020583152771} +11/06/2021 22:06:18 - INFO - __main__ - Step 6079: {'lr': 0.0004990639273345489, 'samples': 1167168, 'steps': 6078, 'loss/train': 1.3877575397491455} +11/06/2021 22:06:18 - INFO - __main__ - Step 6080: {'lr': 0.0004990634684809513, 'samples': 1167360, 'steps': 6079, 'loss/train': 1.8536438941955566} +11/06/2021 22:06:19 - INFO - __main__ - Step 6081: {'lr': 0.0004990630095151296, 'samples': 1167552, 'steps': 6080, 'loss/train': 2.0661253929138184} +11/06/2021 22:06:19 - INFO - __main__ - Step 6082: {'lr': 0.0004990625504370838, 'samples': 1167744, 'steps': 6081, 'loss/train': 1.9790138006210327} +11/06/2021 22:06:20 - INFO - __main__ - Step 6083: {'lr': 0.0004990620912468143, 'samples': 1167936, 'steps': 6082, 'loss/train': 1.5834496021270752} +11/06/2021 22:06:20 - INFO - __main__ - Step 6084: {'lr': 0.0004990616319443214, 'samples': 1168128, 'steps': 6083, 'loss/train': 1.8926007747650146} +11/06/2021 22:06:20 - INFO - __main__ - Step 6085: {'lr': 0.0004990611725296052, 'samples': 1168320, 'steps': 6084, 'loss/train': 1.9960976839065552} +11/06/2021 22:06:21 - INFO - __main__ - Step 6086: {'lr': 0.0004990607130026657, 'samples': 1168512, 'steps': 6085, 'loss/train': 2.563918113708496} +11/06/2021 22:06:22 - INFO - __main__ - Step 6087: {'lr': 0.0004990602533635033, 'samples': 1168704, 'steps': 6086, 'loss/train': 1.8031913042068481} +11/06/2021 22:06:22 - INFO - __main__ - Step 6088: {'lr': 0.0004990597936121182, 'samples': 1168896, 'steps': 6087, 'loss/train': 1.5920250415802002} +11/06/2021 22:06:22 - INFO - __main__ - Step 6089: {'lr': 0.0004990593337485108, 'samples': 1169088, 'steps': 6088, 'loss/train': 2.1160354614257812} +11/06/2021 22:06:23 - INFO - __main__ - Step 6090: {'lr': 0.0004990588737726809, 'samples': 1169280, 'steps': 6089, 'loss/train': 2.0593221187591553} +11/06/2021 22:06:24 - INFO - __main__ - Step 6091: {'lr': 0.0004990584136846289, 'samples': 1169472, 'steps': 6090, 'loss/train': 2.7556521892547607} +11/06/2021 22:06:24 - INFO - __main__ - Step 6092: {'lr': 0.0004990579534843551, 'samples': 1169664, 'steps': 6091, 'loss/train': 2.4434940814971924} +11/06/2021 22:06:24 - INFO - __main__ - Step 6093: {'lr': 0.0004990574931718597, 'samples': 1169856, 'steps': 6092, 'loss/train': 2.342974901199341} +11/06/2021 22:06:25 - INFO - __main__ - Step 6094: {'lr': 0.0004990570327471427, 'samples': 1170048, 'steps': 6093, 'loss/train': 1.9696969985961914} +11/06/2021 22:06:25 - INFO - __main__ - Step 6095: {'lr': 0.0004990565722102045, 'samples': 1170240, 'steps': 6094, 'loss/train': 1.6603606939315796} +11/06/2021 22:06:26 - INFO - __main__ - Step 6096: {'lr': 0.0004990561115610452, 'samples': 1170432, 'steps': 6095, 'loss/train': 1.3589533567428589} +11/06/2021 22:06:26 - INFO - __main__ - Step 6097: {'lr': 0.0004990556507996652, 'samples': 1170624, 'steps': 6096, 'loss/train': 1.9999220371246338} +11/06/2021 22:06:27 - INFO - __main__ - Step 6098: {'lr': 0.0004990551899260644, 'samples': 1170816, 'steps': 6097, 'loss/train': 1.987586498260498} +11/06/2021 22:06:27 - INFO - __main__ - Step 6099: {'lr': 0.0004990547289402433, 'samples': 1171008, 'steps': 6098, 'loss/train': 1.9792393445968628} +11/06/2021 22:06:27 - INFO - __main__ - Step 6100: {'lr': 0.0004990542678422019, 'samples': 1171200, 'steps': 6099, 'loss/train': 1.7970731258392334} +11/06/2021 22:06:29 - INFO - __main__ - Step 6101: {'lr': 0.0004990538066319406, 'samples': 1171392, 'steps': 6100, 'loss/train': 1.9069502353668213} +11/06/2021 22:06:29 - INFO - __main__ - Step 6102: {'lr': 0.0004990533453094594, 'samples': 1171584, 'steps': 6101, 'loss/train': 1.354381799697876} +11/06/2021 22:06:29 - INFO - __main__ - Step 6103: {'lr': 0.0004990528838747586, 'samples': 1171776, 'steps': 6102, 'loss/train': 1.948202133178711} +11/06/2021 22:06:30 - INFO - __main__ - Step 6104: {'lr': 0.0004990524223278384, 'samples': 1171968, 'steps': 6103, 'loss/train': 1.6591429710388184} +11/06/2021 22:06:30 - INFO - __main__ - Step 6105: {'lr': 0.0004990519606686991, 'samples': 1172160, 'steps': 6104, 'loss/train': 2.1720986366271973} +11/06/2021 22:06:31 - INFO - __main__ - Step 6106: {'lr': 0.0004990514988973408, 'samples': 1172352, 'steps': 6105, 'loss/train': 2.1691129207611084} +11/06/2021 22:06:31 - INFO - __main__ - Step 6107: {'lr': 0.0004990510370137637, 'samples': 1172544, 'steps': 6106, 'loss/train': 1.6799395084381104} +11/06/2021 22:06:32 - INFO - __main__ - Step 6108: {'lr': 0.0004990505750179682, 'samples': 1172736, 'steps': 6107, 'loss/train': 1.9363466501235962} +11/06/2021 22:06:32 - INFO - __main__ - Step 6109: {'lr': 0.0004990501129099542, 'samples': 1172928, 'steps': 6108, 'loss/train': 1.7905744314193726} +11/06/2021 22:06:32 - INFO - __main__ - Step 6110: {'lr': 0.000499049650689722, 'samples': 1173120, 'steps': 6109, 'loss/train': 1.5997885465621948} +11/06/2021 22:06:33 - INFO - __main__ - Step 6111: {'lr': 0.000499049188357272, 'samples': 1173312, 'steps': 6110, 'loss/train': 2.1724469661712646} +11/06/2021 22:06:34 - INFO - __main__ - Step 6112: {'lr': 0.0004990487259126043, 'samples': 1173504, 'steps': 6111, 'loss/train': 1.6976191997528076} +11/06/2021 22:06:34 - INFO - __main__ - Step 6113: {'lr': 0.0004990482633557189, 'samples': 1173696, 'steps': 6112, 'loss/train': 1.716886281967163} +11/06/2021 22:06:34 - INFO - __main__ - Step 6114: {'lr': 0.0004990478006866165, 'samples': 1173888, 'steps': 6113, 'loss/train': 1.6597141027450562} +11/06/2021 22:06:35 - INFO - __main__ - Step 6115: {'lr': 0.0004990473379052968, 'samples': 1174080, 'steps': 6114, 'loss/train': 2.12764835357666} +11/06/2021 22:06:36 - INFO - __main__ - Step 6116: {'lr': 0.0004990468750117602, 'samples': 1174272, 'steps': 6115, 'loss/train': 1.4543788433074951} +11/06/2021 22:06:36 - INFO - __main__ - Step 6117: {'lr': 0.000499046412006007, 'samples': 1174464, 'steps': 6116, 'loss/train': 1.662864327430725} +11/06/2021 22:06:37 - INFO - __main__ - Step 6118: {'lr': 0.0004990459488880372, 'samples': 1174656, 'steps': 6117, 'loss/train': 1.5874830484390259} +11/06/2021 22:06:37 - INFO - __main__ - Step 6119: {'lr': 0.0004990454856578513, 'samples': 1174848, 'steps': 6118, 'loss/train': 1.8817105293273926} +11/06/2021 22:06:37 - INFO - __main__ - Step 6120: {'lr': 0.0004990450223154492, 'samples': 1175040, 'steps': 6119, 'loss/train': 1.8093229532241821} +11/06/2021 22:06:38 - INFO - __main__ - Step 6121: {'lr': 0.0004990445588608313, 'samples': 1175232, 'steps': 6120, 'loss/train': 1.6032285690307617} +11/06/2021 22:06:39 - INFO - __main__ - Step 6122: {'lr': 0.0004990440952939979, 'samples': 1175424, 'steps': 6121, 'loss/train': 2.429919719696045} +11/06/2021 22:06:39 - INFO - __main__ - Step 6123: {'lr': 0.0004990436316149489, 'samples': 1175616, 'steps': 6122, 'loss/train': 1.6632248163223267} +11/06/2021 22:06:40 - INFO - __main__ - Step 6124: {'lr': 0.0004990431678236849, 'samples': 1175808, 'steps': 6123, 'loss/train': 1.8044439554214478} +11/06/2021 22:06:40 - INFO - __main__ - Step 6125: {'lr': 0.0004990427039202057, 'samples': 1176000, 'steps': 6124, 'loss/train': 1.9963434934616089} +11/06/2021 22:06:40 - INFO - __main__ - Step 6126: {'lr': 0.0004990422399045117, 'samples': 1176192, 'steps': 6125, 'loss/train': 1.9155720472335815} +11/06/2021 22:06:41 - INFO - __main__ - Step 6127: {'lr': 0.0004990417757766031, 'samples': 1176384, 'steps': 6126, 'loss/train': 1.775386929512024} +11/06/2021 22:06:42 - INFO - __main__ - Step 6128: {'lr': 0.0004990413115364803, 'samples': 1176576, 'steps': 6127, 'loss/train': 1.5602920055389404} +11/06/2021 22:06:42 - INFO - __main__ - Step 6129: {'lr': 0.0004990408471841431, 'samples': 1176768, 'steps': 6128, 'loss/train': 2.0410501956939697} +11/06/2021 22:06:42 - INFO - __main__ - Step 6130: {'lr': 0.0004990403827195921, 'samples': 1176960, 'steps': 6129, 'loss/train': 2.2790169715881348} +11/06/2021 22:06:43 - INFO - __main__ - Step 6131: {'lr': 0.0004990399181428273, 'samples': 1177152, 'steps': 6130, 'loss/train': 2.0821285247802734} +11/06/2021 22:06:44 - INFO - __main__ - Step 6132: {'lr': 0.000499039453453849, 'samples': 1177344, 'steps': 6131, 'loss/train': 1.8965604305267334} +11/06/2021 22:06:44 - INFO - __main__ - Step 6133: {'lr': 0.0004990389886526573, 'samples': 1177536, 'steps': 6132, 'loss/train': 1.8164457082748413} +11/06/2021 22:06:44 - INFO - __main__ - Step 6134: {'lr': 0.0004990385237392524, 'samples': 1177728, 'steps': 6133, 'loss/train': 1.9925854206085205} +11/06/2021 22:06:45 - INFO - __main__ - Step 6135: {'lr': 0.0004990380587136347, 'samples': 1177920, 'steps': 6134, 'loss/train': 1.2192782163619995} +11/06/2021 22:06:45 - INFO - __main__ - Step 6136: {'lr': 0.0004990375935758042, 'samples': 1178112, 'steps': 6135, 'loss/train': 1.5371315479278564} +11/06/2021 22:06:46 - INFO - __main__ - Step 6137: {'lr': 0.0004990371283257613, 'samples': 1178304, 'steps': 6136, 'loss/train': 1.8077142238616943} +11/06/2021 22:06:47 - INFO - __main__ - Step 6138: {'lr': 0.0004990366629635062, 'samples': 1178496, 'steps': 6137, 'loss/train': 2.013735771179199} +11/06/2021 22:06:47 - INFO - __main__ - Step 6139: {'lr': 0.0004990361974890388, 'samples': 1178688, 'steps': 6138, 'loss/train': 2.858919620513916} +11/06/2021 22:06:47 - INFO - __main__ - Step 6140: {'lr': 0.0004990357319023597, 'samples': 1178880, 'steps': 6139, 'loss/train': 1.368839144706726} +11/06/2021 22:06:48 - INFO - __main__ - Step 6141: {'lr': 0.0004990352662034689, 'samples': 1179072, 'steps': 6140, 'loss/train': 1.362464427947998} +11/06/2021 22:06:49 - INFO - __main__ - Step 6142: {'lr': 0.0004990348003923665, 'samples': 1179264, 'steps': 6141, 'loss/train': 1.9596736431121826} +11/06/2021 22:06:49 - INFO - __main__ - Step 6143: {'lr': 0.000499034334469053, 'samples': 1179456, 'steps': 6142, 'loss/train': 2.131988048553467} +11/06/2021 22:06:50 - INFO - __main__ - Step 6144: {'lr': 0.0004990338684335285, 'samples': 1179648, 'steps': 6143, 'loss/train': 1.4277572631835938} +11/06/2021 22:06:50 - INFO - __main__ - Step 6145: {'lr': 0.0004990334022857932, 'samples': 1179840, 'steps': 6144, 'loss/train': 1.9954853057861328} +11/06/2021 22:06:50 - INFO - __main__ - Step 6146: {'lr': 0.0004990329360258472, 'samples': 1180032, 'steps': 6145, 'loss/train': 1.7441011667251587} +11/06/2021 22:06:51 - INFO - __main__ - Step 6147: {'lr': 0.0004990324696536908, 'samples': 1180224, 'steps': 6146, 'loss/train': 0.7077341079711914} +11/06/2021 22:06:52 - INFO - __main__ - Step 6148: {'lr': 0.0004990320031693242, 'samples': 1180416, 'steps': 6147, 'loss/train': 2.2118520736694336} +11/06/2021 22:06:52 - INFO - __main__ - Step 6149: {'lr': 0.0004990315365727476, 'samples': 1180608, 'steps': 6148, 'loss/train': 2.055332660675049} +11/06/2021 22:06:52 - INFO - __main__ - Step 6150: {'lr': 0.0004990310698639614, 'samples': 1180800, 'steps': 6149, 'loss/train': 2.1165621280670166} +11/06/2021 22:06:53 - INFO - __main__ - Step 6151: {'lr': 0.0004990306030429655, 'samples': 1180992, 'steps': 6150, 'loss/train': 1.5419307947158813} +11/06/2021 22:06:53 - INFO - __main__ - Step 6152: {'lr': 0.0004990301361097603, 'samples': 1181184, 'steps': 6151, 'loss/train': 1.1245484352111816} +11/06/2021 22:06:54 - INFO - __main__ - Step 6153: {'lr': 0.000499029669064346, 'samples': 1181376, 'steps': 6152, 'loss/train': 2.3590290546417236} +11/06/2021 22:06:54 - INFO - __main__ - Step 6154: {'lr': 0.0004990292019067227, 'samples': 1181568, 'steps': 6153, 'loss/train': 1.9370914697647095} +11/06/2021 22:06:55 - INFO - __main__ - Step 6155: {'lr': 0.0004990287346368908, 'samples': 1181760, 'steps': 6154, 'loss/train': 2.3206193447113037} +11/06/2021 22:06:55 - INFO - __main__ - Step 6156: {'lr': 0.0004990282672548503, 'samples': 1181952, 'steps': 6155, 'loss/train': 1.679478645324707} +11/06/2021 22:06:56 - INFO - __main__ - Step 6157: {'lr': 0.0004990277997606016, 'samples': 1182144, 'steps': 6156, 'loss/train': 1.524378776550293} +11/06/2021 22:06:56 - INFO - __main__ - Step 6158: {'lr': 0.0004990273321541447, 'samples': 1182336, 'steps': 6157, 'loss/train': 0.6619194149971008} +11/06/2021 22:06:57 - INFO - __main__ - Step 6159: {'lr': 0.0004990268644354799, 'samples': 1182528, 'steps': 6158, 'loss/train': 1.9400123357772827} +11/06/2021 22:06:57 - INFO - __main__ - Step 6160: {'lr': 0.0004990263966046075, 'samples': 1182720, 'steps': 6159, 'loss/train': 1.8187702894210815} +11/06/2021 22:06:57 - INFO - __main__ - Step 6161: {'lr': 0.0004990259286615276, 'samples': 1182912, 'steps': 6160, 'loss/train': 1.444914698600769} +11/06/2021 22:06:58 - INFO - __main__ - Step 6162: {'lr': 0.0004990254606062406, 'samples': 1183104, 'steps': 6161, 'loss/train': 1.4133529663085938} +11/06/2021 22:06:59 - INFO - __main__ - Step 6163: {'lr': 0.0004990249924387465, 'samples': 1183296, 'steps': 6162, 'loss/train': 1.8153014183044434} +11/06/2021 22:06:59 - INFO - __main__ - Step 6164: {'lr': 0.0004990245241590455, 'samples': 1183488, 'steps': 6163, 'loss/train': 1.761313796043396} +11/06/2021 22:07:00 - INFO - __main__ - Step 6165: {'lr': 0.0004990240557671379, 'samples': 1183680, 'steps': 6164, 'loss/train': 0.9687419533729553} +11/06/2021 22:07:00 - INFO - __main__ - Step 6166: {'lr': 0.000499023587263024, 'samples': 1183872, 'steps': 6165, 'loss/train': 1.6445512771606445} +11/06/2021 22:07:00 - INFO - __main__ - Step 6167: {'lr': 0.0004990231186467039, 'samples': 1184064, 'steps': 6166, 'loss/train': 1.3879804611206055} +11/06/2021 22:07:01 - INFO - __main__ - Step 6168: {'lr': 0.0004990226499181778, 'samples': 1184256, 'steps': 6167, 'loss/train': 2.506103992462158} +11/06/2021 22:07:02 - INFO - __main__ - Step 6169: {'lr': 0.0004990221810774459, 'samples': 1184448, 'steps': 6168, 'loss/train': 2.4504177570343018} +11/06/2021 22:07:02 - INFO - __main__ - Step 6170: {'lr': 0.0004990217121245084, 'samples': 1184640, 'steps': 6169, 'loss/train': 1.9792548418045044} +11/06/2021 22:07:02 - INFO - __main__ - Step 6171: {'lr': 0.0004990212430593657, 'samples': 1184832, 'steps': 6170, 'loss/train': 1.8940435647964478} +11/06/2021 22:07:03 - INFO - __main__ - Step 6172: {'lr': 0.0004990207738820178, 'samples': 1185024, 'steps': 6171, 'loss/train': 1.8361660242080688} +11/06/2021 22:07:04 - INFO - __main__ - Step 6173: {'lr': 0.000499020304592465, 'samples': 1185216, 'steps': 6172, 'loss/train': 2.492899179458618} +11/06/2021 22:07:04 - INFO - __main__ - Step 6174: {'lr': 0.0004990198351907075, 'samples': 1185408, 'steps': 6173, 'loss/train': 1.5003889799118042} +11/06/2021 22:07:04 - INFO - __main__ - Step 6175: {'lr': 0.0004990193656767455, 'samples': 1185600, 'steps': 6174, 'loss/train': 2.0811853408813477} +11/06/2021 22:07:05 - INFO - __main__ - Step 6176: {'lr': 0.0004990188960505792, 'samples': 1185792, 'steps': 6175, 'loss/train': 3.0719258785247803} +11/06/2021 22:07:05 - INFO - __main__ - Step 6177: {'lr': 0.0004990184263122088, 'samples': 1185984, 'steps': 6176, 'loss/train': 1.861528754234314} +11/06/2021 22:07:05 - INFO - __main__ - Step 6178: {'lr': 0.0004990179564616346, 'samples': 1186176, 'steps': 6177, 'loss/train': 5.958117485046387} +11/06/2021 22:07:07 - INFO - __main__ - Step 6179: {'lr': 0.0004990174864988566, 'samples': 1186368, 'steps': 6178, 'loss/train': 1.926222562789917} +11/06/2021 22:07:07 - INFO - __main__ - Step 6180: {'lr': 0.0004990170164238754, 'samples': 1186560, 'steps': 6179, 'loss/train': 1.9009610414505005} +11/06/2021 22:07:07 - INFO - __main__ - Step 6181: {'lr': 0.0004990165462366909, 'samples': 1186752, 'steps': 6180, 'loss/train': 2.4664011001586914} +11/06/2021 22:07:08 - INFO - __main__ - Step 6182: {'lr': 0.0004990160759373033, 'samples': 1186944, 'steps': 6181, 'loss/train': 2.10902738571167} +11/06/2021 22:07:08 - INFO - __main__ - Step 6183: {'lr': 0.0004990156055257129, 'samples': 1187136, 'steps': 6182, 'loss/train': 1.813493251800537} +11/06/2021 22:07:09 - INFO - __main__ - Step 6184: {'lr': 0.00049901513500192, 'samples': 1187328, 'steps': 6183, 'loss/train': 2.25309681892395} +11/06/2021 22:07:09 - INFO - __main__ - Step 6185: {'lr': 0.0004990146643659247, 'samples': 1187520, 'steps': 6184, 'loss/train': 2.2059273719787598} +11/06/2021 22:07:10 - INFO - __main__ - Step 6186: {'lr': 0.0004990141936177272, 'samples': 1187712, 'steps': 6185, 'loss/train': 2.0499684810638428} +11/06/2021 22:07:10 - INFO - __main__ - Step 6187: {'lr': 0.0004990137227573278, 'samples': 1187904, 'steps': 6186, 'loss/train': 3.2400269508361816} +11/06/2021 22:07:10 - INFO - __main__ - Step 6188: {'lr': 0.0004990132517847266, 'samples': 1188096, 'steps': 6187, 'loss/train': 1.8898727893829346} +11/06/2021 22:07:11 - INFO - __main__ - Step 6189: {'lr': 0.0004990127806999239, 'samples': 1188288, 'steps': 6188, 'loss/train': 0.9931958317756653} +11/06/2021 22:07:12 - INFO - __main__ - Step 6190: {'lr': 0.0004990123095029199, 'samples': 1188480, 'steps': 6189, 'loss/train': 1.6618373394012451} +11/06/2021 22:07:12 - INFO - __main__ - Step 6191: {'lr': 0.0004990118381937148, 'samples': 1188672, 'steps': 6190, 'loss/train': 1.4901134967803955} +11/06/2021 22:07:12 - INFO - __main__ - Step 6192: {'lr': 0.0004990113667723088, 'samples': 1188864, 'steps': 6191, 'loss/train': 1.1681599617004395} +11/06/2021 22:07:13 - INFO - __main__ - Step 6193: {'lr': 0.000499010895238702, 'samples': 1189056, 'steps': 6192, 'loss/train': 1.8815301656723022} +11/06/2021 22:07:14 - INFO - __main__ - Step 6194: {'lr': 0.0004990104235928948, 'samples': 1189248, 'steps': 6193, 'loss/train': 1.8837906122207642} +11/06/2021 22:07:14 - INFO - __main__ - Step 6195: {'lr': 0.0004990099518348874, 'samples': 1189440, 'steps': 6194, 'loss/train': 2.526460647583008} +11/06/2021 22:07:14 - INFO - __main__ - Step 6196: {'lr': 0.00049900947996468, 'samples': 1189632, 'steps': 6195, 'loss/train': 1.910827875137329} +11/06/2021 22:07:15 - INFO - __main__ - Step 6197: {'lr': 0.0004990090079822726, 'samples': 1189824, 'steps': 6196, 'loss/train': 2.300349473953247} +11/06/2021 22:07:15 - INFO - __main__ - Step 6198: {'lr': 0.0004990085358876658, 'samples': 1190016, 'steps': 6197, 'loss/train': 1.6927975416183472} +11/06/2021 22:07:16 - INFO - __main__ - Step 6199: {'lr': 0.0004990080636808595, 'samples': 1190208, 'steps': 6198, 'loss/train': 2.1126410961151123} +11/06/2021 22:07:17 - INFO - __main__ - Step 6200: {'lr': 0.000499007591361854, 'samples': 1190400, 'steps': 6199, 'loss/train': 1.71726393699646} +11/06/2021 22:07:17 - INFO - __main__ - Step 6201: {'lr': 0.0004990071189306495, 'samples': 1190592, 'steps': 6200, 'loss/train': 2.024538040161133} +11/06/2021 22:07:17 - INFO - __main__ - Step 6202: {'lr': 0.0004990066463872462, 'samples': 1190784, 'steps': 6201, 'loss/train': 1.7335742712020874} +11/06/2021 22:07:18 - INFO - __main__ - Step 6203: {'lr': 0.0004990061737316445, 'samples': 1190976, 'steps': 6202, 'loss/train': 1.7096867561340332} +11/06/2021 22:07:18 - INFO - __main__ - Step 6204: {'lr': 0.0004990057009638443, 'samples': 1191168, 'steps': 6203, 'loss/train': 1.5593353509902954} +11/06/2021 22:07:19 - INFO - __main__ - Step 6205: {'lr': 0.000499005228083846, 'samples': 1191360, 'steps': 6204, 'loss/train': 2.450568437576294} +11/06/2021 22:07:20 - INFO - __main__ - Step 6206: {'lr': 0.0004990047550916498, 'samples': 1191552, 'steps': 6205, 'loss/train': 2.2195775508880615} +11/06/2021 22:07:20 - INFO - __main__ - Step 6207: {'lr': 0.000499004281987256, 'samples': 1191744, 'steps': 6206, 'loss/train': 1.6635841131210327} +11/06/2021 22:07:20 - INFO - __main__ - Step 6208: {'lr': 0.0004990038087706646, 'samples': 1191936, 'steps': 6207, 'loss/train': 1.9627450704574585} +11/06/2021 22:07:21 - INFO - __main__ - Step 6209: {'lr': 0.000499003335441876, 'samples': 1192128, 'steps': 6208, 'loss/train': 2.254753351211548} +11/06/2021 22:07:22 - INFO - __main__ - Step 6210: {'lr': 0.0004990028620008903, 'samples': 1192320, 'steps': 6209, 'loss/train': 1.8182693719863892} +11/06/2021 22:07:22 - INFO - __main__ - Step 6211: {'lr': 0.0004990023884477077, 'samples': 1192512, 'steps': 6210, 'loss/train': 2.1537516117095947} +11/06/2021 22:07:23 - INFO - __main__ - Step 6212: {'lr': 0.0004990019147823286, 'samples': 1192704, 'steps': 6211, 'loss/train': 1.6900304555892944} +11/06/2021 22:07:23 - INFO - __main__ - Step 6213: {'lr': 0.000499001441004753, 'samples': 1192896, 'steps': 6212, 'loss/train': 0.32827237248420715} +11/06/2021 22:07:23 - INFO - __main__ - Step 6214: {'lr': 0.0004990009671149811, 'samples': 1193088, 'steps': 6213, 'loss/train': 1.9133497476577759} +11/06/2021 22:07:24 - INFO - __main__ - Step 6215: {'lr': 0.0004990004931130133, 'samples': 1193280, 'steps': 6214, 'loss/train': 2.055999994277954} +11/06/2021 22:07:25 - INFO - __main__ - Step 6216: {'lr': 0.0004990000189988497, 'samples': 1193472, 'steps': 6215, 'loss/train': 2.248798370361328} +11/06/2021 22:07:25 - INFO - __main__ - Step 6217: {'lr': 0.0004989995447724907, 'samples': 1193664, 'steps': 6216, 'loss/train': 1.8303406238555908} +11/06/2021 22:07:26 - INFO - __main__ - Step 6218: {'lr': 0.0004989990704339361, 'samples': 1193856, 'steps': 6217, 'loss/train': 1.0167715549468994} +11/06/2021 22:07:26 - INFO - __main__ - Step 6219: {'lr': 0.0004989985959831865, 'samples': 1194048, 'steps': 6218, 'loss/train': 1.4236408472061157} +11/06/2021 22:07:27 - INFO - __main__ - Step 6220: {'lr': 0.0004989981214202419, 'samples': 1194240, 'steps': 6219, 'loss/train': 2.0307483673095703} +11/06/2021 22:07:28 - INFO - __main__ - Step 6221: {'lr': 0.0004989976467451026, 'samples': 1194432, 'steps': 6220, 'loss/train': 2.141268253326416} +11/06/2021 22:07:28 - INFO - __main__ - Step 6222: {'lr': 0.0004989971719577688, 'samples': 1194624, 'steps': 6221, 'loss/train': 1.8791309595108032} +11/06/2021 22:07:28 - INFO - __main__ - Step 6223: {'lr': 0.0004989966970582408, 'samples': 1194816, 'steps': 6222, 'loss/train': 1.7829779386520386} +11/06/2021 22:07:29 - INFO - __main__ - Step 6224: {'lr': 0.0004989962220465187, 'samples': 1195008, 'steps': 6223, 'loss/train': 4.018397331237793} +11/06/2021 22:07:29 - INFO - __main__ - Step 6225: {'lr': 0.0004989957469226027, 'samples': 1195200, 'steps': 6224, 'loss/train': 0.3159443736076355} +11/06/2021 22:07:30 - INFO - __main__ - Step 6226: {'lr': 0.0004989952716864931, 'samples': 1195392, 'steps': 6225, 'loss/train': 2.1702065467834473} +11/06/2021 22:07:30 - INFO - __main__ - Step 6227: {'lr': 0.00049899479633819, 'samples': 1195584, 'steps': 6226, 'loss/train': 1.8308675289154053} +11/06/2021 22:07:31 - INFO - __main__ - Step 6228: {'lr': 0.0004989943208776938, 'samples': 1195776, 'steps': 6227, 'loss/train': 2.180677890777588} +11/06/2021 22:07:31 - INFO - __main__ - Step 6229: {'lr': 0.0004989938453050045, 'samples': 1195968, 'steps': 6228, 'loss/train': 1.6663007736206055} +11/06/2021 22:07:31 - INFO - __main__ - Step 6230: {'lr': 0.0004989933696201225, 'samples': 1196160, 'steps': 6229, 'loss/train': 1.936288595199585} +11/06/2021 22:07:33 - INFO - __main__ - Step 6231: {'lr': 0.0004989928938230478, 'samples': 1196352, 'steps': 6230, 'loss/train': 2.008770227432251} +11/06/2021 22:07:33 - INFO - __main__ - Step 6232: {'lr': 0.0004989924179137808, 'samples': 1196544, 'steps': 6231, 'loss/train': 2.004091501235962} +11/06/2021 22:07:33 - INFO - __main__ - Step 6233: {'lr': 0.0004989919418923218, 'samples': 1196736, 'steps': 6232, 'loss/train': 1.9655420780181885} +11/06/2021 22:07:34 - INFO - __main__ - Step 6234: {'lr': 0.0004989914657586707, 'samples': 1196928, 'steps': 6233, 'loss/train': 1.8493226766586304} +11/06/2021 22:07:34 - INFO - __main__ - Step 6235: {'lr': 0.000498990989512828, 'samples': 1197120, 'steps': 6234, 'loss/train': 2.194037675857544} +11/06/2021 22:07:35 - INFO - __main__ - Step 6236: {'lr': 0.0004989905131547937, 'samples': 1197312, 'steps': 6235, 'loss/train': 2.581127643585205} +11/06/2021 22:07:35 - INFO - __main__ - Step 6237: {'lr': 0.0004989900366845682, 'samples': 1197504, 'steps': 6236, 'loss/train': 2.2226333618164062} +11/06/2021 22:07:36 - INFO - __main__ - Step 6238: {'lr': 0.0004989895601021515, 'samples': 1197696, 'steps': 6237, 'loss/train': 2.466501235961914} +11/06/2021 22:07:36 - INFO - __main__ - Step 6239: {'lr': 0.0004989890834075441, 'samples': 1197888, 'steps': 6238, 'loss/train': 1.5966987609863281} +11/06/2021 22:07:36 - INFO - __main__ - Step 6240: {'lr': 0.000498988606600746, 'samples': 1198080, 'steps': 6239, 'loss/train': 1.8267741203308105} +11/06/2021 22:07:37 - INFO - __main__ - Step 6241: {'lr': 0.0004989881296817575, 'samples': 1198272, 'steps': 6240, 'loss/train': 2.1044561862945557} +11/06/2021 22:07:38 - INFO - __main__ - Step 6242: {'lr': 0.0004989876526505788, 'samples': 1198464, 'steps': 6241, 'loss/train': 1.7580589056015015} +11/06/2021 22:07:38 - INFO - __main__ - Step 6243: {'lr': 0.0004989871755072101, 'samples': 1198656, 'steps': 6242, 'loss/train': 1.8593974113464355} +11/06/2021 22:07:38 - INFO - __main__ - Step 6244: {'lr': 0.0004989866982516516, 'samples': 1198848, 'steps': 6243, 'loss/train': 1.7739224433898926} +11/06/2021 22:07:39 - INFO - __main__ - Step 6245: {'lr': 0.0004989862208839035, 'samples': 1199040, 'steps': 6244, 'loss/train': 2.1439409255981445} +11/06/2021 22:07:40 - INFO - __main__ - Step 6246: {'lr': 0.0004989857434039661, 'samples': 1199232, 'steps': 6245, 'loss/train': 1.7785552740097046} +11/06/2021 22:07:40 - INFO - __main__ - Step 6247: {'lr': 0.0004989852658118395, 'samples': 1199424, 'steps': 6246, 'loss/train': 0.6885305047035217} +11/06/2021 22:07:41 - INFO - __main__ - Step 6248: {'lr': 0.000498984788107524, 'samples': 1199616, 'steps': 6247, 'loss/train': 1.918849229812622} +11/06/2021 22:07:41 - INFO - __main__ - Step 6249: {'lr': 0.0004989843102910198, 'samples': 1199808, 'steps': 6248, 'loss/train': 1.5366085767745972} +11/06/2021 22:07:41 - INFO - __main__ - Step 6250: {'lr': 0.0004989838323623272, 'samples': 1200000, 'steps': 6249, 'loss/train': 2.3803365230560303} +11/06/2021 22:07:42 - INFO - __main__ - Step 6251: {'lr': 0.0004989833543214463, 'samples': 1200192, 'steps': 6250, 'loss/train': 1.9775062799453735} +11/06/2021 22:07:43 - INFO - __main__ - Step 6252: {'lr': 0.0004989828761683774, 'samples': 1200384, 'steps': 6251, 'loss/train': 1.7551454305648804} +11/06/2021 22:07:43 - INFO - __main__ - Step 6253: {'lr': 0.0004989823979031205, 'samples': 1200576, 'steps': 6252, 'loss/train': 1.5888711214065552} +11/06/2021 22:07:43 - INFO - __main__ - Step 6254: {'lr': 0.000498981919525676, 'samples': 1200768, 'steps': 6253, 'loss/train': 1.925179362297058} +11/06/2021 22:07:44 - INFO - __main__ - Step 6255: {'lr': 0.0004989814410360442, 'samples': 1200960, 'steps': 6254, 'loss/train': 0.6360993981361389} +11/06/2021 22:07:45 - INFO - __main__ - Step 6256: {'lr': 0.0004989809624342251, 'samples': 1201152, 'steps': 6255, 'loss/train': 1.8095260858535767} +11/06/2021 22:07:45 - INFO - __main__ - Step 6257: {'lr': 0.000498980483720219, 'samples': 1201344, 'steps': 6256, 'loss/train': 1.7746502161026} +11/06/2021 22:07:46 - INFO - __main__ - Step 6258: {'lr': 0.0004989800048940263, 'samples': 1201536, 'steps': 6257, 'loss/train': 2.096313953399658} +11/06/2021 22:07:46 - INFO - __main__ - Step 6259: {'lr': 0.0004989795259556469, 'samples': 1201728, 'steps': 6258, 'loss/train': 2.1959168910980225} +11/06/2021 22:07:46 - INFO - __main__ - Step 6260: {'lr': 0.0004989790469050813, 'samples': 1201920, 'steps': 6259, 'loss/train': 1.8663018941879272} +11/06/2021 22:07:47 - INFO - __main__ - Step 6261: {'lr': 0.0004989785677423295, 'samples': 1202112, 'steps': 6260, 'loss/train': 1.3765881061553955} +11/06/2021 22:07:47 - INFO - __main__ - Step 6262: {'lr': 0.0004989780884673917, 'samples': 1202304, 'steps': 6261, 'loss/train': 2.113983631134033} +11/06/2021 22:07:48 - INFO - __main__ - Step 6263: {'lr': 0.0004989776090802683, 'samples': 1202496, 'steps': 6262, 'loss/train': 2.6338729858398438} +11/06/2021 22:07:48 - INFO - __main__ - Step 6264: {'lr': 0.0004989771295809594, 'samples': 1202688, 'steps': 6263, 'loss/train': 1.5440324544906616} +11/06/2021 22:07:49 - INFO - __main__ - Step 6265: {'lr': 0.0004989766499694653, 'samples': 1202880, 'steps': 6264, 'loss/train': 2.112800121307373} +11/06/2021 22:07:50 - INFO - __main__ - Step 6266: {'lr': 0.0004989761702457862, 'samples': 1203072, 'steps': 6265, 'loss/train': 1.9621334075927734} +11/06/2021 22:07:50 - INFO - __main__ - Step 6267: {'lr': 0.0004989756904099222, 'samples': 1203264, 'steps': 6266, 'loss/train': 2.0875959396362305} +11/06/2021 22:07:50 - INFO - __main__ - Step 6268: {'lr': 0.0004989752104618736, 'samples': 1203456, 'steps': 6267, 'loss/train': 2.009376287460327} +11/06/2021 22:07:51 - INFO - __main__ - Step 6269: {'lr': 0.0004989747304016407, 'samples': 1203648, 'steps': 6268, 'loss/train': 2.29427433013916} +11/06/2021 22:07:51 - INFO - __main__ - Step 6270: {'lr': 0.0004989742502292235, 'samples': 1203840, 'steps': 6269, 'loss/train': 2.1417438983917236} +11/06/2021 22:07:52 - INFO - __main__ - Step 6271: {'lr': 0.0004989737699446225, 'samples': 1204032, 'steps': 6270, 'loss/train': 1.981139063835144} +11/06/2021 22:07:52 - INFO - __main__ - Step 6272: {'lr': 0.0004989732895478376, 'samples': 1204224, 'steps': 6271, 'loss/train': 1.8909876346588135} +11/06/2021 22:07:53 - INFO - __main__ - Step 6273: {'lr': 0.0004989728090388693, 'samples': 1204416, 'steps': 6272, 'loss/train': 1.6940367221832275} +11/06/2021 22:07:53 - INFO - __main__ - Step 6274: {'lr': 0.0004989723284177177, 'samples': 1204608, 'steps': 6273, 'loss/train': 2.325897216796875} +11/06/2021 22:07:53 - INFO - __main__ - Step 6275: {'lr': 0.0004989718476843828, 'samples': 1204800, 'steps': 6274, 'loss/train': 1.9315811395645142} +11/06/2021 22:07:54 - INFO - __main__ - Step 6276: {'lr': 0.0004989713668388652, 'samples': 1204992, 'steps': 6275, 'loss/train': 1.894089937210083} +11/06/2021 22:07:55 - INFO - __main__ - Step 6277: {'lr': 0.000498970885881165, 'samples': 1205184, 'steps': 6276, 'loss/train': 1.7275776863098145} +11/06/2021 22:07:55 - INFO - __main__ - Step 6278: {'lr': 0.0004989704048112823, 'samples': 1205376, 'steps': 6277, 'loss/train': 2.880239486694336} +11/06/2021 22:07:55 - INFO - __main__ - Step 6279: {'lr': 0.0004989699236292173, 'samples': 1205568, 'steps': 6278, 'loss/train': 1.9111852645874023} +11/06/2021 22:07:56 - INFO - __main__ - Step 6280: {'lr': 0.0004989694423349704, 'samples': 1205760, 'steps': 6279, 'loss/train': 2.0868144035339355} +11/06/2021 22:07:57 - INFO - __main__ - Step 6281: {'lr': 0.0004989689609285417, 'samples': 1205952, 'steps': 6280, 'loss/train': 2.3991446495056152} +11/06/2021 22:07:57 - INFO - __main__ - Step 6282: {'lr': 0.0004989684794099314, 'samples': 1206144, 'steps': 6281, 'loss/train': 1.962192177772522} +11/06/2021 22:07:57 - INFO - __main__ - Step 6283: {'lr': 0.0004989679977791397, 'samples': 1206336, 'steps': 6282, 'loss/train': 2.007171630859375} +11/06/2021 22:07:58 - INFO - __main__ - Step 6284: {'lr': 0.0004989675160361669, 'samples': 1206528, 'steps': 6283, 'loss/train': 2.0830070972442627} +11/06/2021 22:07:58 - INFO - __main__ - Step 6285: {'lr': 0.0004989670341810132, 'samples': 1206720, 'steps': 6284, 'loss/train': 1.7555127143859863} +11/06/2021 22:07:59 - INFO - __main__ - Step 6286: {'lr': 0.0004989665522136789, 'samples': 1206912, 'steps': 6285, 'loss/train': 1.7010811567306519} +11/06/2021 22:08:00 - INFO - __main__ - Step 6287: {'lr': 0.0004989660701341639, 'samples': 1207104, 'steps': 6286, 'loss/train': 1.6270495653152466} +11/06/2021 22:08:00 - INFO - __main__ - Step 6288: {'lr': 0.0004989655879424687, 'samples': 1207296, 'steps': 6287, 'loss/train': 0.33006778359413147} +11/06/2021 22:08:00 - INFO - __main__ - Step 6289: {'lr': 0.0004989651056385936, 'samples': 1207488, 'steps': 6288, 'loss/train': 1.9551554918289185} +11/06/2021 22:08:01 - INFO - __main__ - Step 6290: {'lr': 0.0004989646232225384, 'samples': 1207680, 'steps': 6289, 'loss/train': 5.657275199890137} +11/06/2021 22:08:01 - INFO - __main__ - Step 6291: {'lr': 0.0004989641406943037, 'samples': 1207872, 'steps': 6290, 'loss/train': 1.931122899055481} +11/06/2021 22:08:02 - INFO - __main__ - Step 6292: {'lr': 0.0004989636580538896, 'samples': 1208064, 'steps': 6291, 'loss/train': 1.3750081062316895} +11/06/2021 22:08:02 - INFO - __main__ - Step 6293: {'lr': 0.0004989631753012964, 'samples': 1208256, 'steps': 6292, 'loss/train': 2.0061533451080322} +11/06/2021 22:08:03 - INFO - __main__ - Step 6294: {'lr': 0.0004989626924365242, 'samples': 1208448, 'steps': 6293, 'loss/train': 1.9302148818969727} +11/06/2021 22:08:03 - INFO - __main__ - Step 6295: {'lr': 0.0004989622094595733, 'samples': 1208640, 'steps': 6294, 'loss/train': 2.0548641681671143} +11/06/2021 22:08:03 - INFO - __main__ - Step 6296: {'lr': 0.0004989617263704437, 'samples': 1208832, 'steps': 6295, 'loss/train': 1.7614363431930542} +11/06/2021 22:08:05 - INFO - __main__ - Step 6297: {'lr': 0.0004989612431691359, 'samples': 1209024, 'steps': 6296, 'loss/train': 1.5389564037322998} +11/06/2021 22:08:05 - INFO - __main__ - Step 6298: {'lr': 0.0004989607598556501, 'samples': 1209216, 'steps': 6297, 'loss/train': 2.1703968048095703} +11/06/2021 22:08:05 - INFO - __main__ - Step 6299: {'lr': 0.0004989602764299862, 'samples': 1209408, 'steps': 6298, 'loss/train': 1.22577702999115} +11/06/2021 22:08:06 - INFO - __main__ - Step 6300: {'lr': 0.0004989597928921447, 'samples': 1209600, 'steps': 6299, 'loss/train': 2.2829113006591797} +11/06/2021 22:08:06 - INFO - __main__ - Step 6301: {'lr': 0.0004989593092421258, 'samples': 1209792, 'steps': 6300, 'loss/train': 1.3044848442077637} +11/06/2021 22:08:06 - INFO - __main__ - Step 6302: {'lr': 0.0004989588254799297, 'samples': 1209984, 'steps': 6301, 'loss/train': 1.8990617990493774} +11/06/2021 22:08:07 - INFO - __main__ - Step 6303: {'lr': 0.0004989583416055566, 'samples': 1210176, 'steps': 6302, 'loss/train': 1.9017807245254517} +11/06/2021 22:08:08 - INFO - __main__ - Step 6304: {'lr': 0.0004989578576190068, 'samples': 1210368, 'steps': 6303, 'loss/train': 2.0887370109558105} +11/06/2021 22:08:08 - INFO - __main__ - Step 6305: {'lr': 0.0004989573735202802, 'samples': 1210560, 'steps': 6304, 'loss/train': 1.910634994506836} +11/06/2021 22:08:08 - INFO - __main__ - Step 6306: {'lr': 0.0004989568893093774, 'samples': 1210752, 'steps': 6305, 'loss/train': 1.4305139780044556} +11/06/2021 22:08:09 - INFO - __main__ - Step 6307: {'lr': 0.0004989564049862986, 'samples': 1210944, 'steps': 6306, 'loss/train': 1.7775681018829346} +11/06/2021 22:08:10 - INFO - __main__ - Step 6308: {'lr': 0.0004989559205510436, 'samples': 1211136, 'steps': 6307, 'loss/train': 1.7592074871063232} +11/06/2021 22:08:10 - INFO - __main__ - Step 6309: {'lr': 0.000498955436003613, 'samples': 1211328, 'steps': 6308, 'loss/train': 1.7411454916000366} +11/06/2021 22:08:10 - INFO - __main__ - Step 6310: {'lr': 0.0004989549513440071, 'samples': 1211520, 'steps': 6309, 'loss/train': 2.116926431655884} +11/06/2021 22:08:11 - INFO - __main__ - Step 6311: {'lr': 0.0004989544665722258, 'samples': 1211712, 'steps': 6310, 'loss/train': 1.8361932039260864} +11/06/2021 22:08:11 - INFO - __main__ - Step 6312: {'lr': 0.0004989539816882694, 'samples': 1211904, 'steps': 6311, 'loss/train': 1.3926923274993896} +11/06/2021 22:08:12 - INFO - __main__ - Step 6313: {'lr': 0.0004989534966921382, 'samples': 1212096, 'steps': 6312, 'loss/train': 1.8578460216522217} +11/06/2021 22:08:13 - INFO - __main__ - Step 6314: {'lr': 0.0004989530115838324, 'samples': 1212288, 'steps': 6313, 'loss/train': 2.0698132514953613} +11/06/2021 22:08:13 - INFO - __main__ - Step 6315: {'lr': 0.0004989525263633523, 'samples': 1212480, 'steps': 6314, 'loss/train': 1.3116508722305298} +11/06/2021 22:08:13 - INFO - __main__ - Step 6316: {'lr': 0.0004989520410306979, 'samples': 1212672, 'steps': 6315, 'loss/train': 1.9149450063705444} +11/06/2021 22:08:14 - INFO - __main__ - Step 6317: {'lr': 0.0004989515555858697, 'samples': 1212864, 'steps': 6316, 'loss/train': 2.206059694290161} +11/06/2021 22:08:15 - INFO - __main__ - Step 6318: {'lr': 0.0004989510700288678, 'samples': 1213056, 'steps': 6317, 'loss/train': 1.6991815567016602} +11/06/2021 22:08:15 - INFO - __main__ - Step 6319: {'lr': 0.0004989505843596922, 'samples': 1213248, 'steps': 6318, 'loss/train': 2.7226216793060303} +11/06/2021 22:08:15 - INFO - __main__ - Step 6320: {'lr': 0.0004989500985783434, 'samples': 1213440, 'steps': 6319, 'loss/train': 2.1540679931640625} +11/06/2021 22:08:16 - INFO - __main__ - Step 6321: {'lr': 0.0004989496126848215, 'samples': 1213632, 'steps': 6320, 'loss/train': 1.8948540687561035} +11/06/2021 22:08:16 - INFO - __main__ - Step 6322: {'lr': 0.0004989491266791268, 'samples': 1213824, 'steps': 6321, 'loss/train': 1.8643752336502075} +11/06/2021 22:08:17 - INFO - __main__ - Step 6323: {'lr': 0.0004989486405612595, 'samples': 1214016, 'steps': 6322, 'loss/train': 1.8771063089370728} +11/06/2021 22:08:18 - INFO - __main__ - Step 6324: {'lr': 0.0004989481543312196, 'samples': 1214208, 'steps': 6323, 'loss/train': 1.7344616651535034} +11/06/2021 22:08:18 - INFO - __main__ - Step 6325: {'lr': 0.0004989476679890077, 'samples': 1214400, 'steps': 6324, 'loss/train': 1.7559272050857544} +11/06/2021 22:08:18 - INFO - __main__ - Step 6326: {'lr': 0.0004989471815346237, 'samples': 1214592, 'steps': 6325, 'loss/train': 2.1662731170654297} +11/06/2021 22:08:19 - INFO - __main__ - Step 6327: {'lr': 0.000498946694968068, 'samples': 1214784, 'steps': 6326, 'loss/train': 2.0608224868774414} +11/06/2021 22:08:19 - INFO - __main__ - Step 6328: {'lr': 0.0004989462082893407, 'samples': 1214976, 'steps': 6327, 'loss/train': 2.2688443660736084} +11/06/2021 22:08:20 - INFO - __main__ - Step 6329: {'lr': 0.0004989457214984421, 'samples': 1215168, 'steps': 6328, 'loss/train': 2.0150251388549805} +11/06/2021 22:08:20 - INFO - __main__ - Step 6330: {'lr': 0.0004989452345953725, 'samples': 1215360, 'steps': 6329, 'loss/train': 1.8572430610656738} +11/06/2021 22:08:21 - INFO - __main__ - Step 6331: {'lr': 0.000498944747580132, 'samples': 1215552, 'steps': 6330, 'loss/train': 1.986055850982666} +11/06/2021 22:08:21 - INFO - __main__ - Step 6332: {'lr': 0.0004989442604527208, 'samples': 1215744, 'steps': 6331, 'loss/train': 1.7587941884994507} +11/06/2021 22:08:21 - INFO - __main__ - Step 6333: {'lr': 0.0004989437732131391, 'samples': 1215936, 'steps': 6332, 'loss/train': 1.8428518772125244} +11/06/2021 22:08:23 - INFO - __main__ - Step 6334: {'lr': 0.0004989432858613873, 'samples': 1216128, 'steps': 6333, 'loss/train': 2.1033074855804443} +11/06/2021 22:08:23 - INFO - __main__ - Step 6335: {'lr': 0.0004989427983974653, 'samples': 1216320, 'steps': 6334, 'loss/train': 1.3180185556411743} +11/06/2021 22:08:23 - INFO - __main__ - Step 6336: {'lr': 0.0004989423108213737, 'samples': 1216512, 'steps': 6335, 'loss/train': 2.3260984420776367} +11/06/2021 22:08:24 - INFO - __main__ - Step 6337: {'lr': 0.0004989418231331124, 'samples': 1216704, 'steps': 6336, 'loss/train': 2.056525230407715} +11/06/2021 22:08:24 - INFO - __main__ - Step 6338: {'lr': 0.0004989413353326818, 'samples': 1216896, 'steps': 6337, 'loss/train': 2.151630401611328} +11/06/2021 22:08:25 - INFO - __main__ - Step 6339: {'lr': 0.0004989408474200821, 'samples': 1217088, 'steps': 6338, 'loss/train': 0.4232385456562042} +11/06/2021 22:08:25 - INFO - __main__ - Step 6340: {'lr': 0.0004989403593953135, 'samples': 1217280, 'steps': 6339, 'loss/train': 2.0424396991729736} +11/06/2021 22:08:26 - INFO - __main__ - Step 6341: {'lr': 0.0004989398712583762, 'samples': 1217472, 'steps': 6340, 'loss/train': 1.5621088743209839} +11/06/2021 22:08:26 - INFO - __main__ - Step 6342: {'lr': 0.0004989393830092705, 'samples': 1217664, 'steps': 6341, 'loss/train': 2.555983781814575} +11/06/2021 22:08:26 - INFO - __main__ - Step 6343: {'lr': 0.0004989388946479965, 'samples': 1217856, 'steps': 6342, 'loss/train': 1.820717692375183} +11/06/2021 22:08:27 - INFO - __main__ - Step 6344: {'lr': 0.0004989384061745545, 'samples': 1218048, 'steps': 6343, 'loss/train': 1.8627382516860962} +11/06/2021 22:08:28 - INFO - __main__ - Step 6345: {'lr': 0.0004989379175889447, 'samples': 1218240, 'steps': 6344, 'loss/train': 2.2447197437286377} +11/06/2021 22:08:28 - INFO - __main__ - Step 6346: {'lr': 0.0004989374288911672, 'samples': 1218432, 'steps': 6345, 'loss/train': 2.0814595222473145} +11/06/2021 22:08:28 - INFO - __main__ - Step 6347: {'lr': 0.0004989369400812225, 'samples': 1218624, 'steps': 6346, 'loss/train': 1.2773443460464478} +11/06/2021 22:08:29 - INFO - __main__ - Step 6348: {'lr': 0.0004989364511591106, 'samples': 1218816, 'steps': 6347, 'loss/train': 1.5852837562561035} +11/06/2021 22:08:29 - INFO - __main__ - Step 6349: {'lr': 0.0004989359621248317, 'samples': 1219008, 'steps': 6348, 'loss/train': 1.5508657693862915} +11/06/2021 22:08:30 - INFO - __main__ - Step 6350: {'lr': 0.0004989354729783861, 'samples': 1219200, 'steps': 6349, 'loss/train': 1.6555392742156982} +11/06/2021 22:08:31 - INFO - __main__ - Step 6351: {'lr': 0.0004989349837197742, 'samples': 1219392, 'steps': 6350, 'loss/train': 1.6861871480941772} +11/06/2021 22:08:31 - INFO - __main__ - Step 6352: {'lr': 0.0004989344943489958, 'samples': 1219584, 'steps': 6351, 'loss/train': 2.0413320064544678} +11/06/2021 22:08:31 - INFO - __main__ - Step 6353: {'lr': 0.0004989340048660515, 'samples': 1219776, 'steps': 6352, 'loss/train': 2.444296360015869} +11/06/2021 22:08:32 - INFO - __main__ - Step 6354: {'lr': 0.0004989335152709414, 'samples': 1219968, 'steps': 6353, 'loss/train': 2.159029245376587} +11/06/2021 22:08:33 - INFO - __main__ - Step 6355: {'lr': 0.0004989330255636656, 'samples': 1220160, 'steps': 6354, 'loss/train': 1.5128992795944214} +11/06/2021 22:08:33 - INFO - __main__ - Step 6356: {'lr': 0.0004989325357442245, 'samples': 1220352, 'steps': 6355, 'loss/train': 1.8759398460388184} +11/06/2021 22:08:33 - INFO - __main__ - Step 6357: {'lr': 0.0004989320458126182, 'samples': 1220544, 'steps': 6356, 'loss/train': 1.6384868621826172} +11/06/2021 22:08:34 - INFO - __main__ - Step 6358: {'lr': 0.0004989315557688469, 'samples': 1220736, 'steps': 6357, 'loss/train': 2.0724997520446777} +11/06/2021 22:08:34 - INFO - __main__ - Step 6359: {'lr': 0.000498931065612911, 'samples': 1220928, 'steps': 6358, 'loss/train': 1.3788177967071533} +11/06/2021 22:08:35 - INFO - __main__ - Step 6360: {'lr': 0.0004989305753448106, 'samples': 1221120, 'steps': 6359, 'loss/train': 1.6440093517303467} +11/06/2021 22:08:35 - INFO - __main__ - Step 6361: {'lr': 0.0004989300849645459, 'samples': 1221312, 'steps': 6360, 'loss/train': 0.8680780529975891} +11/06/2021 22:08:36 - INFO - __main__ - Step 6362: {'lr': 0.0004989295944721171, 'samples': 1221504, 'steps': 6361, 'loss/train': 1.834447979927063} +11/06/2021 22:08:36 - INFO - __main__ - Step 6363: {'lr': 0.0004989291038675245, 'samples': 1221696, 'steps': 6362, 'loss/train': 2.109246015548706} +11/06/2021 22:08:36 - INFO - __main__ - Step 6364: {'lr': 0.0004989286131507682, 'samples': 1221888, 'steps': 6363, 'loss/train': 2.3124148845672607} +11/06/2021 22:08:37 - INFO - __main__ - Step 6365: {'lr': 0.0004989281223218486, 'samples': 1222080, 'steps': 6364, 'loss/train': 2.2666964530944824} +11/06/2021 22:08:38 - INFO - __main__ - Step 6366: {'lr': 0.0004989276313807658, 'samples': 1222272, 'steps': 6365, 'loss/train': 2.1086597442626953} +11/06/2021 22:08:38 - INFO - __main__ - Step 6367: {'lr': 0.00049892714032752, 'samples': 1222464, 'steps': 6366, 'loss/train': 1.7961052656173706} +11/06/2021 22:08:39 - INFO - __main__ - Step 6368: {'lr': 0.0004989266491621117, 'samples': 1222656, 'steps': 6367, 'loss/train': 1.7916598320007324} +11/06/2021 22:08:39 - INFO - __main__ - Step 6369: {'lr': 0.0004989261578845406, 'samples': 1222848, 'steps': 6368, 'loss/train': 2.015110731124878} +11/06/2021 22:08:40 - INFO - __main__ - Step 6370: {'lr': 0.0004989256664948073, 'samples': 1223040, 'steps': 6369, 'loss/train': 1.7681583166122437} +11/06/2021 22:08:40 - INFO - __main__ - Step 6371: {'lr': 0.000498925174992912, 'samples': 1223232, 'steps': 6370, 'loss/train': 2.142261266708374} +11/06/2021 22:08:41 - INFO - __main__ - Step 6372: {'lr': 0.0004989246833788549, 'samples': 1223424, 'steps': 6371, 'loss/train': 1.6870710849761963} +11/06/2021 22:08:41 - INFO - __main__ - Step 6373: {'lr': 0.000498924191652636, 'samples': 1223616, 'steps': 6372, 'loss/train': 1.6174527406692505} +11/06/2021 22:08:41 - INFO - __main__ - Step 6374: {'lr': 0.0004989236998142559, 'samples': 1223808, 'steps': 6373, 'loss/train': 1.6731904745101929} +11/06/2021 22:08:42 - INFO - __main__ - Step 6375: {'lr': 0.0004989232078637145, 'samples': 1224000, 'steps': 6374, 'loss/train': 1.9477375745773315} +11/06/2021 22:08:44 - INFO - __main__ - Step 6376: {'lr': 0.0004989227158010123, 'samples': 1224192, 'steps': 6375, 'loss/train': 1.9696638584136963} +11/06/2021 22:08:44 - INFO - __main__ - Step 6377: {'lr': 0.0004989222236261491, 'samples': 1224384, 'steps': 6376, 'loss/train': 2.0389769077301025} +11/06/2021 22:08:45 - INFO - __main__ - Step 6378: {'lr': 0.0004989217313391256, 'samples': 1224576, 'steps': 6377, 'loss/train': 1.981373906135559} +11/06/2021 22:08:45 - INFO - __main__ - Step 6379: {'lr': 0.0004989212389399417, 'samples': 1224768, 'steps': 6378, 'loss/train': 1.8569397926330566} +11/06/2021 22:08:46 - INFO - __main__ - Step 6380: {'lr': 0.0004989207464285978, 'samples': 1224960, 'steps': 6379, 'loss/train': 1.8618382215499878} +11/06/2021 22:08:46 - INFO - __main__ - Step 6381: {'lr': 0.0004989202538050939, 'samples': 1225152, 'steps': 6380, 'loss/train': 1.969157099723816} +11/06/2021 22:08:46 - INFO - __main__ - Step 6382: {'lr': 0.0004989197610694306, 'samples': 1225344, 'steps': 6381, 'loss/train': 4.056380748748779} +11/06/2021 22:08:47 - INFO - __main__ - Step 6383: {'lr': 0.0004989192682216078, 'samples': 1225536, 'steps': 6382, 'loss/train': 2.3175463676452637} +11/06/2021 22:08:48 - INFO - __main__ - Step 6384: {'lr': 0.0004989187752616258, 'samples': 1225728, 'steps': 6383, 'loss/train': 2.1582441329956055} +11/06/2021 22:08:48 - INFO - __main__ - Step 6385: {'lr': 0.0004989182821894849, 'samples': 1225920, 'steps': 6384, 'loss/train': 1.9625952243804932} +11/06/2021 22:08:48 - INFO - __main__ - Step 6386: {'lr': 0.0004989177890051852, 'samples': 1226112, 'steps': 6385, 'loss/train': 2.3441145420074463} +11/06/2021 22:08:49 - INFO - __main__ - Step 6387: {'lr': 0.000498917295708727, 'samples': 1226304, 'steps': 6386, 'loss/train': 2.260986328125} +11/06/2021 22:08:49 - INFO - __main__ - Step 6388: {'lr': 0.0004989168023001105, 'samples': 1226496, 'steps': 6387, 'loss/train': 2.005218029022217} +11/06/2021 22:08:50 - INFO - __main__ - Step 6389: {'lr': 0.0004989163087793359, 'samples': 1226688, 'steps': 6388, 'loss/train': 1.657336950302124} +11/06/2021 22:08:50 - INFO - __main__ - Step 6390: {'lr': 0.0004989158151464036, 'samples': 1226880, 'steps': 6389, 'loss/train': 1.1649143695831299} +11/06/2021 22:08:51 - INFO - __main__ - Step 6391: {'lr': 0.0004989153214013135, 'samples': 1227072, 'steps': 6390, 'loss/train': 2.1878926753997803} +11/06/2021 22:08:51 - INFO - __main__ - Step 6392: {'lr': 0.0004989148275440661, 'samples': 1227264, 'steps': 6391, 'loss/train': 2.312974691390991} +11/06/2021 22:08:51 - INFO - __main__ - Step 6393: {'lr': 0.0004989143335746614, 'samples': 1227456, 'steps': 6392, 'loss/train': 2.0476460456848145} +11/06/2021 22:08:52 - INFO - __main__ - Step 6394: {'lr': 0.0004989138394930998, 'samples': 1227648, 'steps': 6393, 'loss/train': 2.358633518218994} +11/06/2021 22:08:53 - INFO - __main__ - Step 6395: {'lr': 0.0004989133452993816, 'samples': 1227840, 'steps': 6394, 'loss/train': 1.8311744928359985} +11/06/2021 22:08:53 - INFO - __main__ - Step 6396: {'lr': 0.0004989128509935068, 'samples': 1228032, 'steps': 6395, 'loss/train': 1.4626703262329102} +11/06/2021 22:08:53 - INFO - __main__ - Step 6397: {'lr': 0.0004989123565754756, 'samples': 1228224, 'steps': 6396, 'loss/train': 2.180896043777466} +11/06/2021 22:08:54 - INFO - __main__ - Step 6398: {'lr': 0.0004989118620452884, 'samples': 1228416, 'steps': 6397, 'loss/train': 1.6816266775131226} +11/06/2021 22:08:55 - INFO - __main__ - Step 6399: {'lr': 0.0004989113674029454, 'samples': 1228608, 'steps': 6398, 'loss/train': 2.068782091140747} +11/06/2021 22:08:55 - INFO - __main__ - Step 6400: {'lr': 0.0004989108726484469, 'samples': 1228800, 'steps': 6399, 'loss/train': 2.064892530441284} +11/06/2021 22:08:55 - INFO - __main__ - Step 6401: {'lr': 0.0004989103777817928, 'samples': 1228992, 'steps': 6400, 'loss/train': 1.7987390756607056} +11/06/2021 22:08:56 - INFO - __main__ - Step 6402: {'lr': 0.0004989098828029836, 'samples': 1229184, 'steps': 6401, 'loss/train': 2.1822431087493896} +11/06/2021 22:08:56 - INFO - __main__ - Step 6403: {'lr': 0.0004989093877120194, 'samples': 1229376, 'steps': 6402, 'loss/train': 1.9657015800476074} +11/06/2021 22:08:58 - INFO - __main__ - Step 6404: {'lr': 0.0004989088925089005, 'samples': 1229568, 'steps': 6403, 'loss/train': 1.4904416799545288} +11/06/2021 22:08:58 - INFO - __main__ - Step 6405: {'lr': 0.0004989083971936271, 'samples': 1229760, 'steps': 6404, 'loss/train': 2.7258121967315674} +11/06/2021 22:08:58 - INFO - __main__ - Step 6406: {'lr': 0.0004989079017661994, 'samples': 1229952, 'steps': 6405, 'loss/train': 1.961512804031372} +11/06/2021 22:08:59 - INFO - __main__ - Step 6407: {'lr': 0.0004989074062266177, 'samples': 1230144, 'steps': 6406, 'loss/train': 5.536162853240967} +11/06/2021 22:08:59 - INFO - __main__ - Step 6408: {'lr': 0.0004989069105748821, 'samples': 1230336, 'steps': 6407, 'loss/train': 1.5103638172149658} +11/06/2021 22:08:59 - INFO - __main__ - Step 6409: {'lr': 0.0004989064148109929, 'samples': 1230528, 'steps': 6408, 'loss/train': 1.6851413249969482} +11/06/2021 22:09:00 - INFO - __main__ - Step 6410: {'lr': 0.0004989059189349503, 'samples': 1230720, 'steps': 6409, 'loss/train': 1.7821619510650635} +11/06/2021 22:09:01 - INFO - __main__ - Step 6411: {'lr': 0.0004989054229467546, 'samples': 1230912, 'steps': 6410, 'loss/train': 1.9058226346969604} +11/06/2021 22:09:01 - INFO - __main__ - Step 6412: {'lr': 0.0004989049268464058, 'samples': 1231104, 'steps': 6411, 'loss/train': 1.1312766075134277} +11/06/2021 22:09:01 - INFO - __main__ - Step 6413: {'lr': 0.0004989044306339044, 'samples': 1231296, 'steps': 6412, 'loss/train': 2.2100672721862793} +11/06/2021 22:09:02 - INFO - __main__ - Step 6414: {'lr': 0.0004989039343092505, 'samples': 1231488, 'steps': 6413, 'loss/train': 1.6702120304107666} +11/06/2021 22:09:03 - INFO - __main__ - Step 6415: {'lr': 0.0004989034378724443, 'samples': 1231680, 'steps': 6414, 'loss/train': 2.1043949127197266} +11/06/2021 22:09:03 - INFO - __main__ - Step 6416: {'lr': 0.0004989029413234861, 'samples': 1231872, 'steps': 6415, 'loss/train': 1.9456948041915894} +11/06/2021 22:09:03 - INFO - __main__ - Step 6417: {'lr': 0.000498902444662376, 'samples': 1232064, 'steps': 6416, 'loss/train': 2.429739475250244} +11/06/2021 22:09:04 - INFO - __main__ - Step 6418: {'lr': 0.0004989019478891144, 'samples': 1232256, 'steps': 6417, 'loss/train': 2.0660645961761475} +11/06/2021 22:09:04 - INFO - __main__ - Step 6419: {'lr': 0.0004989014510037013, 'samples': 1232448, 'steps': 6418, 'loss/train': 1.0096818208694458} +11/06/2021 22:09:05 - INFO - __main__ - Step 6420: {'lr': 0.0004989009540061373, 'samples': 1232640, 'steps': 6419, 'loss/train': 1.7009047269821167} +11/06/2021 22:09:05 - INFO - __main__ - Step 6421: {'lr': 0.0004989004568964221, 'samples': 1232832, 'steps': 6420, 'loss/train': 1.8998950719833374} +11/06/2021 22:09:06 - INFO - __main__ - Step 6422: {'lr': 0.0004988999596745562, 'samples': 1233024, 'steps': 6421, 'loss/train': 2.2160139083862305} +11/06/2021 22:09:06 - INFO - __main__ - Step 6423: {'lr': 0.00049889946234054, 'samples': 1233216, 'steps': 6422, 'loss/train': 1.466779351234436} +11/06/2021 22:09:07 - INFO - __main__ - Step 6424: {'lr': 0.0004988989648943734, 'samples': 1233408, 'steps': 6423, 'loss/train': 1.9524688720703125} +11/06/2021 22:09:08 - INFO - __main__ - Step 6425: {'lr': 0.0004988984673360568, 'samples': 1233600, 'steps': 6424, 'loss/train': 1.4690804481506348} +11/06/2021 22:09:08 - INFO - __main__ - Step 6426: {'lr': 0.0004988979696655904, 'samples': 1233792, 'steps': 6425, 'loss/train': 1.6141606569290161} +11/06/2021 22:09:08 - INFO - __main__ - Step 6427: {'lr': 0.0004988974718829744, 'samples': 1233984, 'steps': 6426, 'loss/train': 1.9417755603790283} +11/06/2021 22:09:09 - INFO - __main__ - Step 6428: {'lr': 0.0004988969739882091, 'samples': 1234176, 'steps': 6427, 'loss/train': 1.8715691566467285} +11/06/2021 22:09:09 - INFO - __main__ - Step 6429: {'lr': 0.0004988964759812946, 'samples': 1234368, 'steps': 6428, 'loss/train': 1.668321132659912} +11/06/2021 22:09:11 - INFO - __main__ - Step 6430: {'lr': 0.0004988959778622313, 'samples': 1234560, 'steps': 6429, 'loss/train': 1.9378490447998047} +11/06/2021 22:09:11 - INFO - __main__ - Step 6431: {'lr': 0.0004988954796310191, 'samples': 1234752, 'steps': 6430, 'loss/train': 1.9765774011611938} +11/06/2021 22:09:12 - INFO - __main__ - Step 6432: {'lr': 0.0004988949812876586, 'samples': 1234944, 'steps': 6431, 'loss/train': 1.7189645767211914} +11/06/2021 22:09:12 - INFO - __main__ - Step 6433: {'lr': 0.0004988944828321499, 'samples': 1235136, 'steps': 6432, 'loss/train': 1.8814183473587036} +11/06/2021 22:09:12 - INFO - __main__ - Step 6434: {'lr': 0.0004988939842644931, 'samples': 1235328, 'steps': 6433, 'loss/train': 1.60706627368927} +11/06/2021 22:09:13 - INFO - __main__ - Step 6435: {'lr': 0.0004988934855846885, 'samples': 1235520, 'steps': 6434, 'loss/train': 1.5853242874145508} +11/06/2021 22:09:13 - INFO - __main__ - Step 6436: {'lr': 0.0004988929867927363, 'samples': 1235712, 'steps': 6435, 'loss/train': 1.9436169862747192} +11/06/2021 22:09:13 - INFO - __main__ - Step 6437: {'lr': 0.0004988924878886368, 'samples': 1235904, 'steps': 6436, 'loss/train': 1.9640707969665527} +11/06/2021 22:09:15 - INFO - __main__ - Step 6438: {'lr': 0.0004988919888723902, 'samples': 1236096, 'steps': 6437, 'loss/train': 1.9225521087646484} +11/06/2021 22:09:15 - INFO - __main__ - Step 6439: {'lr': 0.0004988914897439968, 'samples': 1236288, 'steps': 6438, 'loss/train': 1.5273348093032837} +11/06/2021 22:09:15 - INFO - __main__ - Step 6440: {'lr': 0.0004988909905034566, 'samples': 1236480, 'steps': 6439, 'loss/train': 1.8240584135055542} +11/06/2021 22:09:16 - INFO - __main__ - Step 6441: {'lr': 0.00049889049115077, 'samples': 1236672, 'steps': 6440, 'loss/train': 1.741806983947754} +11/06/2021 22:09:16 - INFO - __main__ - Step 6442: {'lr': 0.0004988899916859372, 'samples': 1236864, 'steps': 6441, 'loss/train': 2.750673294067383} +11/06/2021 22:09:17 - INFO - __main__ - Step 6443: {'lr': 0.0004988894921089584, 'samples': 1237056, 'steps': 6442, 'loss/train': 1.7780988216400146} +11/06/2021 22:09:17 - INFO - __main__ - Step 6444: {'lr': 0.0004988889924198339, 'samples': 1237248, 'steps': 6443, 'loss/train': 1.9567726850509644} +11/06/2021 22:09:18 - INFO - __main__ - Step 6445: {'lr': 0.0004988884926185637, 'samples': 1237440, 'steps': 6444, 'loss/train': 1.8130319118499756} +11/06/2021 22:09:18 - INFO - __main__ - Step 6446: {'lr': 0.0004988879927051484, 'samples': 1237632, 'steps': 6445, 'loss/train': 1.573569655418396} +11/06/2021 22:09:18 - INFO - __main__ - Step 6447: {'lr': 0.0004988874926795878, 'samples': 1237824, 'steps': 6446, 'loss/train': 1.8743444681167603} +11/06/2021 22:09:19 - INFO - __main__ - Step 6448: {'lr': 0.0004988869925418825, 'samples': 1238016, 'steps': 6447, 'loss/train': 1.5253403186798096} +11/06/2021 22:09:20 - INFO - __main__ - Step 6449: {'lr': 0.0004988864922920325, 'samples': 1238208, 'steps': 6448, 'loss/train': 1.7076308727264404} +11/06/2021 22:09:20 - INFO - __main__ - Step 6450: {'lr': 0.000498885991930038, 'samples': 1238400, 'steps': 6449, 'loss/train': 2.227938413619995} +11/06/2021 22:09:20 - INFO - __main__ - Step 6451: {'lr': 0.0004988854914558994, 'samples': 1238592, 'steps': 6450, 'loss/train': 1.7760518789291382} +11/06/2021 22:09:21 - INFO - __main__ - Step 6452: {'lr': 0.0004988849908696169, 'samples': 1238784, 'steps': 6451, 'loss/train': 2.213900566101074} +11/06/2021 22:09:21 - INFO - __main__ - Step 6453: {'lr': 0.0004988844901711905, 'samples': 1238976, 'steps': 6452, 'loss/train': 2.0823049545288086} +11/06/2021 22:09:22 - INFO - __main__ - Step 6454: {'lr': 0.0004988839893606208, 'samples': 1239168, 'steps': 6453, 'loss/train': 1.9034770727157593} +11/06/2021 22:09:23 - INFO - __main__ - Step 6455: {'lr': 0.0004988834884379076, 'samples': 1239360, 'steps': 6454, 'loss/train': 1.2255651950836182} +11/06/2021 22:09:23 - INFO - __main__ - Step 6456: {'lr': 0.0004988829874030514, 'samples': 1239552, 'steps': 6455, 'loss/train': 2.5880677700042725} +11/06/2021 22:09:23 - INFO - __main__ - Step 6457: {'lr': 0.0004988824862560525, 'samples': 1239744, 'steps': 6456, 'loss/train': 4.904447078704834} +11/06/2021 22:09:24 - INFO - __main__ - Step 6458: {'lr': 0.0004988819849969109, 'samples': 1239936, 'steps': 6457, 'loss/train': 1.9330166578292847} +11/06/2021 22:09:25 - INFO - __main__ - Step 6459: {'lr': 0.0004988814836256269, 'samples': 1240128, 'steps': 6458, 'loss/train': 1.4734045267105103} +11/06/2021 22:09:25 - INFO - __main__ - Step 6460: {'lr': 0.0004988809821422008, 'samples': 1240320, 'steps': 6459, 'loss/train': 2.5002269744873047} +11/06/2021 22:09:25 - INFO - __main__ - Step 6461: {'lr': 0.0004988804805466327, 'samples': 1240512, 'steps': 6460, 'loss/train': 1.7648297548294067} +11/06/2021 22:09:26 - INFO - __main__ - Step 6462: {'lr': 0.000498879978838923, 'samples': 1240704, 'steps': 6461, 'loss/train': 2.2282261848449707} +11/06/2021 22:09:26 - INFO - __main__ - Step 6463: {'lr': 0.0004988794770190717, 'samples': 1240896, 'steps': 6462, 'loss/train': 2.106597661972046} +11/06/2021 22:09:27 - INFO - __main__ - Step 6464: {'lr': 0.0004988789750870792, 'samples': 1241088, 'steps': 6463, 'loss/train': 2.194019317626953} +11/06/2021 22:09:28 - INFO - __main__ - Step 6465: {'lr': 0.0004988784730429457, 'samples': 1241280, 'steps': 6464, 'loss/train': 2.4788918495178223} +11/06/2021 22:09:28 - INFO - __main__ - Step 6466: {'lr': 0.0004988779708866714, 'samples': 1241472, 'steps': 6465, 'loss/train': 2.1936397552490234} +11/06/2021 22:09:28 - INFO - __main__ - Step 6467: {'lr': 0.0004988774686182564, 'samples': 1241664, 'steps': 6466, 'loss/train': 1.6836004257202148} +11/06/2021 22:09:29 - INFO - __main__ - Step 6468: {'lr': 0.0004988769662377013, 'samples': 1241856, 'steps': 6467, 'loss/train': 2.2871172428131104} +11/06/2021 22:09:29 - INFO - __main__ - Step 6469: {'lr': 0.0004988764637450058, 'samples': 1242048, 'steps': 6468, 'loss/train': 2.1349170207977295} +11/06/2021 22:09:30 - INFO - __main__ - Step 6470: {'lr': 0.0004988759611401706, 'samples': 1242240, 'steps': 6469, 'loss/train': 2.350022315979004} +11/06/2021 22:09:30 - INFO - __main__ - Step 6471: {'lr': 0.0004988754584231957, 'samples': 1242432, 'steps': 6470, 'loss/train': 1.986899971961975} +11/06/2021 22:09:31 - INFO - __main__ - Step 6472: {'lr': 0.0004988749555940814, 'samples': 1242624, 'steps': 6471, 'loss/train': 1.6348545551300049} +11/06/2021 22:09:31 - INFO - __main__ - Step 6473: {'lr': 0.0004988744526528277, 'samples': 1242816, 'steps': 6472, 'loss/train': 2.23770809173584} +11/06/2021 22:09:31 - INFO - __main__ - Step 6474: {'lr': 0.0004988739495994352, 'samples': 1243008, 'steps': 6473, 'loss/train': 1.4470930099487305} +11/06/2021 22:09:32 - INFO - __main__ - Step 6475: {'lr': 0.0004988734464339038, 'samples': 1243200, 'steps': 6474, 'loss/train': 1.8867287635803223} +11/06/2021 22:09:33 - INFO - __main__ - Step 6476: {'lr': 0.0004988729431562339, 'samples': 1243392, 'steps': 6475, 'loss/train': 2.184319496154785} +11/06/2021 22:09:33 - INFO - __main__ - Step 6477: {'lr': 0.0004988724397664258, 'samples': 1243584, 'steps': 6476, 'loss/train': 2.0487940311431885} +11/06/2021 22:09:33 - INFO - __main__ - Step 6478: {'lr': 0.0004988719362644795, 'samples': 1243776, 'steps': 6477, 'loss/train': 2.7399888038635254} +11/06/2021 22:09:34 - INFO - __main__ - Step 6479: {'lr': 0.0004988714326503953, 'samples': 1243968, 'steps': 6478, 'loss/train': 1.4962778091430664} +11/06/2021 22:09:35 - INFO - __main__ - Step 6480: {'lr': 0.0004988709289241736, 'samples': 1244160, 'steps': 6479, 'loss/train': 2.1878020763397217} +11/06/2021 22:09:35 - INFO - __main__ - Step 6481: {'lr': 0.0004988704250858145, 'samples': 1244352, 'steps': 6480, 'loss/train': 1.851172685623169} +11/06/2021 22:09:36 - INFO - __main__ - Step 6482: {'lr': 0.0004988699211353182, 'samples': 1244544, 'steps': 6481, 'loss/train': 1.0221189260482788} +11/06/2021 22:09:36 - INFO - __main__ - Step 6483: {'lr': 0.000498869417072685, 'samples': 1244736, 'steps': 6482, 'loss/train': 1.667419672012329} +11/06/2021 22:09:36 - INFO - __main__ - Step 6484: {'lr': 0.000498868912897915, 'samples': 1244928, 'steps': 6483, 'loss/train': 1.5354762077331543} +11/06/2021 22:09:37 - INFO - __main__ - Step 6485: {'lr': 0.0004988684086110085, 'samples': 1245120, 'steps': 6484, 'loss/train': 1.7448598146438599} +11/06/2021 22:09:38 - INFO - __main__ - Step 6486: {'lr': 0.0004988679042119658, 'samples': 1245312, 'steps': 6485, 'loss/train': 1.7529888153076172} +11/06/2021 22:09:38 - INFO - __main__ - Step 6487: {'lr': 0.000498867399700787, 'samples': 1245504, 'steps': 6486, 'loss/train': 2.0920798778533936} +11/06/2021 22:09:38 - INFO - __main__ - Step 6488: {'lr': 0.0004988668950774724, 'samples': 1245696, 'steps': 6487, 'loss/train': 2.620828151702881} +11/06/2021 22:09:39 - INFO - __main__ - Step 6489: {'lr': 0.0004988663903420222, 'samples': 1245888, 'steps': 6488, 'loss/train': 2.216024398803711} +11/06/2021 22:09:39 - INFO - __main__ - Step 6490: {'lr': 0.0004988658854944367, 'samples': 1246080, 'steps': 6489, 'loss/train': 2.130100727081299} +11/06/2021 22:09:40 - INFO - __main__ - Step 6491: {'lr': 0.0004988653805347161, 'samples': 1246272, 'steps': 6490, 'loss/train': 1.8137882947921753} +11/06/2021 22:09:40 - INFO - __main__ - Step 6492: {'lr': 0.0004988648754628605, 'samples': 1246464, 'steps': 6491, 'loss/train': 1.7981539964675903} +11/06/2021 22:09:41 - INFO - __main__ - Step 6493: {'lr': 0.0004988643702788703, 'samples': 1246656, 'steps': 6492, 'loss/train': 2.0300815105438232} +11/06/2021 22:09:41 - INFO - __main__ - Step 6494: {'lr': 0.0004988638649827456, 'samples': 1246848, 'steps': 6493, 'loss/train': 2.65700101852417} +11/06/2021 22:09:41 - INFO - __main__ - Step 6495: {'lr': 0.0004988633595744867, 'samples': 1247040, 'steps': 6494, 'loss/train': 2.369478940963745} +11/06/2021 22:09:43 - INFO - __main__ - Step 6496: {'lr': 0.0004988628540540939, 'samples': 1247232, 'steps': 6495, 'loss/train': 1.5928741693496704} +11/06/2021 22:09:43 - INFO - __main__ - Step 6497: {'lr': 0.0004988623484215673, 'samples': 1247424, 'steps': 6496, 'loss/train': 0.6462783217430115} +11/06/2021 22:09:43 - INFO - __main__ - Step 6498: {'lr': 0.0004988618426769071, 'samples': 1247616, 'steps': 6497, 'loss/train': 1.936950922012329} +11/06/2021 22:09:44 - INFO - __main__ - Step 6499: {'lr': 0.0004988613368201135, 'samples': 1247808, 'steps': 6498, 'loss/train': 2.1868393421173096} +11/06/2021 22:09:44 - INFO - __main__ - Step 6500: {'lr': 0.0004988608308511871, 'samples': 1248000, 'steps': 6499, 'loss/train': 1.6641846895217896} +11/06/2021 22:09:45 - INFO - __main__ - Step 6501: {'lr': 0.0004988603247701276, 'samples': 1248192, 'steps': 6500, 'loss/train': 1.803402066230774} +11/06/2021 22:09:45 - INFO - __main__ - Step 6502: {'lr': 0.0004988598185769357, 'samples': 1248384, 'steps': 6501, 'loss/train': 2.2652242183685303} +11/06/2021 22:09:46 - INFO - __main__ - Step 6503: {'lr': 0.0004988593122716112, 'samples': 1248576, 'steps': 6502, 'loss/train': 1.5960944890975952} +11/06/2021 22:09:46 - INFO - __main__ - Step 6504: {'lr': 0.0004988588058541547, 'samples': 1248768, 'steps': 6503, 'loss/train': 1.9997038841247559} +11/06/2021 22:09:46 - INFO - __main__ - Step 6505: {'lr': 0.0004988582993245661, 'samples': 1248960, 'steps': 6504, 'loss/train': 2.119647264480591} +11/06/2021 22:09:47 - INFO - __main__ - Step 6506: {'lr': 0.0004988577926828459, 'samples': 1249152, 'steps': 6505, 'loss/train': 1.9104197025299072} +11/06/2021 22:09:48 - INFO - __main__ - Step 6507: {'lr': 0.0004988572859289941, 'samples': 1249344, 'steps': 6506, 'loss/train': 0.5368994474411011} +11/06/2021 22:09:48 - INFO - __main__ - Step 6508: {'lr': 0.0004988567790630111, 'samples': 1249536, 'steps': 6507, 'loss/train': 1.2611361742019653} +11/06/2021 22:09:48 - INFO - __main__ - Step 6509: {'lr': 0.0004988562720848973, 'samples': 1249728, 'steps': 6508, 'loss/train': 2.310293674468994} +11/06/2021 22:09:49 - INFO - __main__ - Step 6510: {'lr': 0.0004988557649946525, 'samples': 1249920, 'steps': 6509, 'loss/train': 1.3652870655059814} +11/06/2021 22:09:50 - INFO - __main__ - Step 6511: {'lr': 0.000498855257792277, 'samples': 1250112, 'steps': 6510, 'loss/train': 2.2352139949798584} +11/06/2021 22:09:50 - INFO - __main__ - Step 6512: {'lr': 0.0004988547504777714, 'samples': 1250304, 'steps': 6511, 'loss/train': 1.4359506368637085} +11/06/2021 22:09:50 - INFO - __main__ - Step 6513: {'lr': 0.0004988542430511356, 'samples': 1250496, 'steps': 6512, 'loss/train': 2.3191769123077393} +11/06/2021 22:09:51 - INFO - __main__ - Step 6514: {'lr': 0.0004988537355123699, 'samples': 1250688, 'steps': 6513, 'loss/train': 2.3833720684051514} +11/06/2021 22:09:51 - INFO - __main__ - Step 6515: {'lr': 0.0004988532278614745, 'samples': 1250880, 'steps': 6514, 'loss/train': 1.4373453855514526} +11/06/2021 22:09:52 - INFO - __main__ - Step 6516: {'lr': 0.0004988527200984498, 'samples': 1251072, 'steps': 6515, 'loss/train': 1.5178534984588623} +11/06/2021 22:09:52 - INFO - __main__ - Step 6517: {'lr': 0.0004988522122232958, 'samples': 1251264, 'steps': 6516, 'loss/train': 1.9620566368103027} +11/06/2021 22:09:53 - INFO - __main__ - Step 6518: {'lr': 0.0004988517042360128, 'samples': 1251456, 'steps': 6517, 'loss/train': 1.9547860622406006} +11/06/2021 22:09:53 - INFO - __main__ - Step 6519: {'lr': 0.0004988511961366012, 'samples': 1251648, 'steps': 6518, 'loss/train': 5.9194560050964355} +11/06/2021 22:09:54 - INFO - __main__ - Step 6520: {'lr': 0.000498850687925061, 'samples': 1251840, 'steps': 6519, 'loss/train': 2.1525418758392334} +11/06/2021 22:09:54 - INFO - __main__ - Step 6521: {'lr': 0.0004988501796013926, 'samples': 1252032, 'steps': 6520, 'loss/train': 1.9909714460372925} +11/06/2021 22:09:55 - INFO - __main__ - Step 6522: {'lr': 0.0004988496711655961, 'samples': 1252224, 'steps': 6521, 'loss/train': 1.5848283767700195} +11/06/2021 22:09:55 - INFO - __main__ - Step 6523: {'lr': 0.0004988491626176718, 'samples': 1252416, 'steps': 6522, 'loss/train': 1.9467501640319824} +11/06/2021 22:09:56 - INFO - __main__ - Step 6524: {'lr': 0.0004988486539576198, 'samples': 1252608, 'steps': 6523, 'loss/train': 2.0624489784240723} +11/06/2021 22:09:56 - INFO - __main__ - Step 6525: {'lr': 0.0004988481451854406, 'samples': 1252800, 'steps': 6524, 'loss/train': 1.9637494087219238} +11/06/2021 22:09:56 - INFO - __main__ - Step 6526: {'lr': 0.0004988476363011341, 'samples': 1252992, 'steps': 6525, 'loss/train': 2.017069101333618} +11/06/2021 22:09:57 - INFO - __main__ - Step 6527: {'lr': 0.0004988471273047008, 'samples': 1253184, 'steps': 6526, 'loss/train': 1.8356379270553589} +11/06/2021 22:09:58 - INFO - __main__ - Step 6528: {'lr': 0.0004988466181961408, 'samples': 1253376, 'steps': 6527, 'loss/train': 1.6690013408660889} +11/06/2021 22:09:58 - INFO - __main__ - Step 6529: {'lr': 0.0004988461089754544, 'samples': 1253568, 'steps': 6528, 'loss/train': 1.86026930809021} +11/06/2021 22:09:58 - INFO - __main__ - Step 6530: {'lr': 0.0004988455996426418, 'samples': 1253760, 'steps': 6529, 'loss/train': 1.9897722005844116} +11/06/2021 22:09:59 - INFO - __main__ - Step 6531: {'lr': 0.0004988450901977031, 'samples': 1253952, 'steps': 6530, 'loss/train': 2.079590082168579} +11/06/2021 22:10:00 - INFO - __main__ - Step 6532: {'lr': 0.0004988445806406387, 'samples': 1254144, 'steps': 6531, 'loss/train': 3.077930212020874} +11/06/2021 22:10:00 - INFO - __main__ - Step 6533: {'lr': 0.0004988440709714487, 'samples': 1254336, 'steps': 6532, 'loss/train': 2.232908010482788} +11/06/2021 22:10:01 - INFO - __main__ - Step 6534: {'lr': 0.0004988435611901335, 'samples': 1254528, 'steps': 6533, 'loss/train': 1.569143533706665} +11/06/2021 22:10:01 - INFO - __main__ - Step 6535: {'lr': 0.0004988430512966932, 'samples': 1254720, 'steps': 6534, 'loss/train': 2.3683085441589355} +11/06/2021 22:10:01 - INFO - __main__ - Step 6536: {'lr': 0.000498842541291128, 'samples': 1254912, 'steps': 6535, 'loss/train': 1.7087137699127197} +11/06/2021 22:10:02 - INFO - __main__ - Step 6537: {'lr': 0.0004988420311734383, 'samples': 1255104, 'steps': 6536, 'loss/train': 2.1297061443328857} +11/06/2021 22:10:03 - INFO - __main__ - Step 6538: {'lr': 0.0004988415209436243, 'samples': 1255296, 'steps': 6537, 'loss/train': 1.857115387916565} +11/06/2021 22:10:03 - INFO - __main__ - Step 6539: {'lr': 0.000498841010601686, 'samples': 1255488, 'steps': 6538, 'loss/train': 2.037982225418091} +11/06/2021 22:10:03 - INFO - __main__ - Step 6540: {'lr': 0.0004988405001476237, 'samples': 1255680, 'steps': 6539, 'loss/train': 2.1346702575683594} +11/06/2021 22:10:04 - INFO - __main__ - Step 6541: {'lr': 0.0004988399895814378, 'samples': 1255872, 'steps': 6540, 'loss/train': 1.6024067401885986} +11/06/2021 22:10:05 - INFO - __main__ - Step 6542: {'lr': 0.0004988394789031286, 'samples': 1256064, 'steps': 6541, 'loss/train': 2.4668922424316406} +11/06/2021 22:10:05 - INFO - __main__ - Step 6543: {'lr': 0.000498838968112696, 'samples': 1256256, 'steps': 6542, 'loss/train': 1.6090011596679688} +11/06/2021 22:10:05 - INFO - __main__ - Step 6544: {'lr': 0.0004988384572101403, 'samples': 1256448, 'steps': 6543, 'loss/train': 1.8808883428573608} +11/06/2021 22:10:06 - INFO - __main__ - Step 6545: {'lr': 0.000498837946195462, 'samples': 1256640, 'steps': 6544, 'loss/train': 1.728848934173584} +11/06/2021 22:10:06 - INFO - __main__ - Step 6546: {'lr': 0.0004988374350686611, 'samples': 1256832, 'steps': 6545, 'loss/train': 1.9686365127563477} +11/06/2021 22:10:07 - INFO - __main__ - Step 6547: {'lr': 0.000498836923829738, 'samples': 1257024, 'steps': 6546, 'loss/train': 1.8499354124069214} +11/06/2021 22:10:07 - INFO - __main__ - Step 6548: {'lr': 0.0004988364124786927, 'samples': 1257216, 'steps': 6547, 'loss/train': 1.4615224599838257} +11/06/2021 22:10:08 - INFO - __main__ - Step 6549: {'lr': 0.0004988359010155255, 'samples': 1257408, 'steps': 6548, 'loss/train': 1.7403419017791748} +11/06/2021 22:10:08 - INFO - __main__ - Step 6550: {'lr': 0.0004988353894402368, 'samples': 1257600, 'steps': 6549, 'loss/train': 1.965841293334961} +11/06/2021 22:10:09 - INFO - __main__ - Step 6551: {'lr': 0.0004988348777528267, 'samples': 1257792, 'steps': 6550, 'loss/train': 2.171156883239746} +11/06/2021 22:10:09 - INFO - __main__ - Step 6552: {'lr': 0.0004988343659532954, 'samples': 1257984, 'steps': 6551, 'loss/train': 2.217395782470703} +11/06/2021 22:10:10 - INFO - __main__ - Step 6553: {'lr': 0.0004988338540416432, 'samples': 1258176, 'steps': 6552, 'loss/train': 2.0271527767181396} +11/06/2021 22:10:10 - INFO - __main__ - Step 6554: {'lr': 0.0004988333420178704, 'samples': 1258368, 'steps': 6553, 'loss/train': 1.7768346071243286} +11/06/2021 22:10:11 - INFO - __main__ - Step 6555: {'lr': 0.000498832829881977, 'samples': 1258560, 'steps': 6554, 'loss/train': 2.1017751693725586} +11/06/2021 22:10:11 - INFO - __main__ - Step 6556: {'lr': 0.0004988323176339633, 'samples': 1258752, 'steps': 6555, 'loss/train': 1.467564582824707} +11/06/2021 22:10:11 - INFO - __main__ - Step 6557: {'lr': 0.0004988318052738298, 'samples': 1258944, 'steps': 6556, 'loss/train': 1.9192558526992798} +11/06/2021 22:10:12 - INFO - __main__ - Step 6558: {'lr': 0.0004988312928015763, 'samples': 1259136, 'steps': 6557, 'loss/train': 1.927575945854187} +11/06/2021 22:10:13 - INFO - __main__ - Step 6559: {'lr': 0.0004988307802172035, 'samples': 1259328, 'steps': 6558, 'loss/train': 2.1528429985046387} +11/06/2021 22:10:13 - INFO - __main__ - Step 6560: {'lr': 0.0004988302675207112, 'samples': 1259520, 'steps': 6559, 'loss/train': 2.317401170730591} +11/06/2021 22:10:13 - INFO - __main__ - Step 6561: {'lr': 0.0004988297547121, 'samples': 1259712, 'steps': 6560, 'loss/train': 1.843315839767456} +11/06/2021 22:10:14 - INFO - __main__ - Step 6562: {'lr': 0.0004988292417913698, 'samples': 1259904, 'steps': 6561, 'loss/train': 2.109565019607544} +11/06/2021 22:10:15 - INFO - __main__ - Step 6563: {'lr': 0.0004988287287585211, 'samples': 1260096, 'steps': 6562, 'loss/train': 0.9284586906433105} +11/06/2021 22:10:15 - INFO - __main__ - Step 6564: {'lr': 0.0004988282156135539, 'samples': 1260288, 'steps': 6563, 'loss/train': 1.7303180694580078} +11/06/2021 22:10:15 - INFO - __main__ - Step 6565: {'lr': 0.0004988277023564685, 'samples': 1260480, 'steps': 6564, 'loss/train': 2.28778338432312} +11/06/2021 22:10:16 - INFO - __main__ - Step 6566: {'lr': 0.0004988271889872654, 'samples': 1260672, 'steps': 6565, 'loss/train': 2.138411045074463} +11/06/2021 22:10:16 - INFO - __main__ - Step 6567: {'lr': 0.0004988266755059444, 'samples': 1260864, 'steps': 6566, 'loss/train': 2.42995023727417} +11/06/2021 22:10:17 - INFO - __main__ - Step 6568: {'lr': 0.000498826161912506, 'samples': 1261056, 'steps': 6567, 'loss/train': 1.8563683032989502} +11/06/2021 22:10:17 - INFO - __main__ - Step 6569: {'lr': 0.0004988256482069505, 'samples': 1261248, 'steps': 6568, 'loss/train': 1.7521291971206665} +11/06/2021 22:10:18 - INFO - __main__ - Step 6570: {'lr': 0.0004988251343892779, 'samples': 1261440, 'steps': 6569, 'loss/train': 1.6020236015319824} +11/06/2021 22:10:18 - INFO - __main__ - Step 6571: {'lr': 0.0004988246204594885, 'samples': 1261632, 'steps': 6570, 'loss/train': 1.995780348777771} +11/06/2021 22:10:18 - INFO - __main__ - Step 6572: {'lr': 0.0004988241064175826, 'samples': 1261824, 'steps': 6571, 'loss/train': 2.2202649116516113} +11/06/2021 22:10:19 - INFO - __main__ - Step 6573: {'lr': 0.0004988235922635604, 'samples': 1262016, 'steps': 6572, 'loss/train': 2.3514225482940674} +11/06/2021 22:10:20 - INFO - __main__ - Step 6574: {'lr': 0.0004988230779974221, 'samples': 1262208, 'steps': 6573, 'loss/train': 1.9057080745697021} +11/06/2021 22:10:20 - INFO - __main__ - Step 6575: {'lr': 0.000498822563619168, 'samples': 1262400, 'steps': 6574, 'loss/train': 1.9137215614318848} +11/06/2021 22:10:21 - INFO - __main__ - Step 6576: {'lr': 0.0004988220491287983, 'samples': 1262592, 'steps': 6575, 'loss/train': 1.931260108947754} +11/06/2021 22:10:21 - INFO - __main__ - Step 6577: {'lr': 0.0004988215345263132, 'samples': 1262784, 'steps': 6576, 'loss/train': 1.774949550628662} +11/06/2021 22:10:21 - INFO - __main__ - Step 6578: {'lr': 0.0004988210198117129, 'samples': 1262976, 'steps': 6577, 'loss/train': 1.8798142671585083} +11/06/2021 22:10:22 - INFO - __main__ - Step 6579: {'lr': 0.0004988205049849978, 'samples': 1263168, 'steps': 6578, 'loss/train': 2.2597692012786865} +11/06/2021 22:10:23 - INFO - __main__ - Step 6580: {'lr': 0.0004988199900461679, 'samples': 1263360, 'steps': 6579, 'loss/train': 2.158470869064331} +11/06/2021 22:10:23 - INFO - __main__ - Step 6581: {'lr': 0.0004988194749952237, 'samples': 1263552, 'steps': 6580, 'loss/train': 1.9333513975143433} +11/06/2021 22:10:23 - INFO - __main__ - Step 6582: {'lr': 0.0004988189598321652, 'samples': 1263744, 'steps': 6581, 'loss/train': 2.1383774280548096} +11/06/2021 22:10:24 - INFO - __main__ - Step 6583: {'lr': 0.0004988184445569926, 'samples': 1263936, 'steps': 6582, 'loss/train': 2.0251195430755615} +11/06/2021 22:10:25 - INFO - __main__ - Step 6584: {'lr': 0.0004988179291697064, 'samples': 1264128, 'steps': 6583, 'loss/train': 1.354901671409607} +11/06/2021 22:10:25 - INFO - __main__ - Step 6585: {'lr': 0.0004988174136703066, 'samples': 1264320, 'steps': 6584, 'loss/train': 1.922788381576538} +11/06/2021 22:10:25 - INFO - __main__ - Step 6586: {'lr': 0.0004988168980587936, 'samples': 1264512, 'steps': 6585, 'loss/train': 1.8145787715911865} +11/06/2021 22:10:26 - INFO - __main__ - Step 6587: {'lr': 0.0004988163823351676, 'samples': 1264704, 'steps': 6586, 'loss/train': 1.9621999263763428} +11/06/2021 22:10:26 - INFO - __main__ - Step 6588: {'lr': 0.0004988158664994286, 'samples': 1264896, 'steps': 6587, 'loss/train': 1.8063040971755981} +11/06/2021 22:10:27 - INFO - __main__ - Step 6589: {'lr': 0.0004988153505515771, 'samples': 1265088, 'steps': 6588, 'loss/train': 2.8506147861480713} +11/06/2021 22:10:28 - INFO - __main__ - Step 6590: {'lr': 0.0004988148344916133, 'samples': 1265280, 'steps': 6589, 'loss/train': 1.649754524230957} +11/06/2021 22:10:28 - INFO - __main__ - Step 6591: {'lr': 0.0004988143183195373, 'samples': 1265472, 'steps': 6590, 'loss/train': 1.709517478942871} +11/06/2021 22:10:28 - INFO - __main__ - Step 6592: {'lr': 0.0004988138020353493, 'samples': 1265664, 'steps': 6591, 'loss/train': 1.7125308513641357} +11/06/2021 22:10:29 - INFO - __main__ - Step 6593: {'lr': 0.0004988132856390498, 'samples': 1265856, 'steps': 6592, 'loss/train': 1.3303931951522827} +11/06/2021 22:10:30 - INFO - __main__ - Step 6594: {'lr': 0.0004988127691306388, 'samples': 1266048, 'steps': 6593, 'loss/train': 2.029025077819824} +11/06/2021 22:10:30 - INFO - __main__ - Step 6595: {'lr': 0.0004988122525101166, 'samples': 1266240, 'steps': 6594, 'loss/train': 1.7039332389831543} +11/06/2021 22:10:30 - INFO - __main__ - Step 6596: {'lr': 0.0004988117357774835, 'samples': 1266432, 'steps': 6595, 'loss/train': 2.2546744346618652} +11/06/2021 22:10:31 - INFO - __main__ - Step 6597: {'lr': 0.0004988112189327397, 'samples': 1266624, 'steps': 6596, 'loss/train': 2.0449981689453125} +11/06/2021 22:10:31 - INFO - __main__ - Step 6598: {'lr': 0.0004988107019758853, 'samples': 1266816, 'steps': 6597, 'loss/train': 1.963868260383606} +11/06/2021 22:10:31 - INFO - __main__ - Step 6599: {'lr': 0.0004988101849069208, 'samples': 1267008, 'steps': 6598, 'loss/train': 1.7069015502929688} +11/06/2021 22:10:32 - INFO - __main__ - Step 6600: {'lr': 0.0004988096677258461, 'samples': 1267200, 'steps': 6599, 'loss/train': 2.1868088245391846} +11/06/2021 22:10:33 - INFO - __main__ - Step 6601: {'lr': 0.0004988091504326616, 'samples': 1267392, 'steps': 6600, 'loss/train': 1.8266377449035645} +11/06/2021 22:10:33 - INFO - __main__ - Step 6602: {'lr': 0.0004988086330273676, 'samples': 1267584, 'steps': 6601, 'loss/train': 1.2428114414215088} +11/06/2021 22:10:34 - INFO - __main__ - Step 6603: {'lr': 0.0004988081155099643, 'samples': 1267776, 'steps': 6602, 'loss/train': 1.4701017141342163} +11/06/2021 22:10:34 - INFO - __main__ - Step 6604: {'lr': 0.0004988075978804518, 'samples': 1267968, 'steps': 6603, 'loss/train': 1.7105156183242798} +11/06/2021 22:10:35 - INFO - __main__ - Step 6605: {'lr': 0.0004988070801388306, 'samples': 1268160, 'steps': 6604, 'loss/train': 0.2404092252254486} +11/06/2021 22:10:35 - INFO - __main__ - Step 6606: {'lr': 0.0004988065622851006, 'samples': 1268352, 'steps': 6605, 'loss/train': 1.55886709690094} +11/06/2021 22:10:36 - INFO - __main__ - Step 6607: {'lr': 0.0004988060443192623, 'samples': 1268544, 'steps': 6606, 'loss/train': 1.470017671585083} +11/06/2021 22:10:36 - INFO - __main__ - Step 6608: {'lr': 0.0004988055262413158, 'samples': 1268736, 'steps': 6607, 'loss/train': 1.6374818086624146} +11/06/2021 22:10:36 - INFO - __main__ - Step 6609: {'lr': 0.0004988050080512614, 'samples': 1268928, 'steps': 6608, 'loss/train': 1.785929799079895} +11/06/2021 22:10:37 - INFO - __main__ - Step 6610: {'lr': 0.0004988044897490993, 'samples': 1269120, 'steps': 6609, 'loss/train': 1.8489357233047485} +11/06/2021 22:10:38 - INFO - __main__ - Step 6611: {'lr': 0.0004988039713348297, 'samples': 1269312, 'steps': 6610, 'loss/train': 2.0114858150482178} +11/06/2021 22:10:38 - INFO - __main__ - Step 6612: {'lr': 0.0004988034528084529, 'samples': 1269504, 'steps': 6611, 'loss/train': 1.6072686910629272} +11/06/2021 22:10:38 - INFO - __main__ - Step 6613: {'lr': 0.000498802934169969, 'samples': 1269696, 'steps': 6612, 'loss/train': 2.4517900943756104} +11/06/2021 22:10:39 - INFO - __main__ - Step 6614: {'lr': 0.0004988024154193785, 'samples': 1269888, 'steps': 6613, 'loss/train': 2.244598627090454} +11/06/2021 22:10:40 - INFO - __main__ - Step 6615: {'lr': 0.0004988018965566814, 'samples': 1270080, 'steps': 6614, 'loss/train': 1.5164146423339844} +11/06/2021 22:10:40 - INFO - __main__ - Step 6616: {'lr': 0.000498801377581878, 'samples': 1270272, 'steps': 6615, 'loss/train': 1.9338390827178955} +11/06/2021 22:10:40 - INFO - __main__ - Step 6617: {'lr': 0.0004988008584949686, 'samples': 1270464, 'steps': 6616, 'loss/train': 0.2597677409648895} +11/06/2021 22:10:41 - INFO - __main__ - Step 6618: {'lr': 0.0004988003392959533, 'samples': 1270656, 'steps': 6617, 'loss/train': 2.182772397994995} +11/06/2021 22:10:41 - INFO - __main__ - Step 6619: {'lr': 0.0004987998199848324, 'samples': 1270848, 'steps': 6618, 'loss/train': 1.4753804206848145} +11/06/2021 22:10:42 - INFO - __main__ - Step 6620: {'lr': 0.0004987993005616061, 'samples': 1271040, 'steps': 6619, 'loss/train': 1.8077441453933716} +11/06/2021 22:10:43 - INFO - __main__ - Step 6621: {'lr': 0.0004987987810262747, 'samples': 1271232, 'steps': 6620, 'loss/train': 0.7256439328193665} +11/06/2021 22:10:43 - INFO - __main__ - Step 6622: {'lr': 0.0004987982613788384, 'samples': 1271424, 'steps': 6621, 'loss/train': 1.808817744255066} +11/06/2021 22:10:43 - INFO - __main__ - Step 6623: {'lr': 0.0004987977416192976, 'samples': 1271616, 'steps': 6622, 'loss/train': 2.2159342765808105} +11/06/2021 22:10:44 - INFO - __main__ - Step 6624: {'lr': 0.0004987972217476523, 'samples': 1271808, 'steps': 6623, 'loss/train': 2.1314337253570557} +11/06/2021 22:10:45 - INFO - __main__ - Step 6625: {'lr': 0.0004987967017639027, 'samples': 1272000, 'steps': 6624, 'loss/train': 1.8644086122512817} +11/06/2021 22:10:45 - INFO - __main__ - Step 6626: {'lr': 0.0004987961816680492, 'samples': 1272192, 'steps': 6625, 'loss/train': 1.5684220790863037} +11/06/2021 22:10:45 - INFO - __main__ - Step 6627: {'lr': 0.000498795661460092, 'samples': 1272384, 'steps': 6626, 'loss/train': 2.122796058654785} +11/06/2021 22:10:46 - INFO - __main__ - Step 6628: {'lr': 0.0004987951411400313, 'samples': 1272576, 'steps': 6627, 'loss/train': 1.8228185176849365} +11/06/2021 22:10:46 - INFO - __main__ - Step 6629: {'lr': 0.0004987946207078674, 'samples': 1272768, 'steps': 6628, 'loss/train': 1.77996826171875} +11/06/2021 22:10:47 - INFO - __main__ - Step 6630: {'lr': 0.0004987941001636004, 'samples': 1272960, 'steps': 6629, 'loss/train': 2.308150291442871} +11/06/2021 22:10:47 - INFO - __main__ - Step 6631: {'lr': 0.0004987935795072307, 'samples': 1273152, 'steps': 6630, 'loss/train': 1.8831443786621094} +11/06/2021 22:10:48 - INFO - __main__ - Step 6632: {'lr': 0.0004987930587387584, 'samples': 1273344, 'steps': 6631, 'loss/train': 2.2510716915130615} +11/06/2021 22:10:48 - INFO - __main__ - Step 6633: {'lr': 0.0004987925378581838, 'samples': 1273536, 'steps': 6632, 'loss/train': 1.590349793434143} +11/06/2021 22:10:48 - INFO - __main__ - Step 6634: {'lr': 0.0004987920168655071, 'samples': 1273728, 'steps': 6633, 'loss/train': 1.4046695232391357} +11/06/2021 22:10:49 - INFO - __main__ - Step 6635: {'lr': 0.0004987914957607286, 'samples': 1273920, 'steps': 6634, 'loss/train': 2.134047746658325} +11/06/2021 22:10:50 - INFO - __main__ - Step 6636: {'lr': 0.0004987909745438484, 'samples': 1274112, 'steps': 6635, 'loss/train': 1.8218518495559692} +11/06/2021 22:10:50 - INFO - __main__ - Step 6637: {'lr': 0.000498790453214867, 'samples': 1274304, 'steps': 6636, 'loss/train': 2.182149648666382} +11/06/2021 22:10:51 - INFO - __main__ - Step 6638: {'lr': 0.0004987899317737843, 'samples': 1274496, 'steps': 6637, 'loss/train': 2.091320753097534} +11/06/2021 22:10:51 - INFO - __main__ - Step 6639: {'lr': 0.0004987894102206008, 'samples': 1274688, 'steps': 6638, 'loss/train': 1.5049811601638794} +11/06/2021 22:10:51 - INFO - __main__ - Step 6640: {'lr': 0.0004987888885553166, 'samples': 1274880, 'steps': 6639, 'loss/train': 2.0964086055755615} +11/06/2021 22:10:52 - INFO - __main__ - Step 6641: {'lr': 0.0004987883667779319, 'samples': 1275072, 'steps': 6640, 'loss/train': 0.3089179992675781} +11/06/2021 22:10:53 - INFO - __main__ - Step 6642: {'lr': 0.0004987878448884471, 'samples': 1275264, 'steps': 6641, 'loss/train': 1.5907493829727173} +11/06/2021 22:10:53 - INFO - __main__ - Step 6643: {'lr': 0.0004987873228868622, 'samples': 1275456, 'steps': 6642, 'loss/train': 1.9820168018341064} +11/06/2021 22:10:53 - INFO - __main__ - Step 6644: {'lr': 0.0004987868007731778, 'samples': 1275648, 'steps': 6643, 'loss/train': 1.0979185104370117} +11/06/2021 22:10:54 - INFO - __main__ - Step 6645: {'lr': 0.0004987862785473937, 'samples': 1275840, 'steps': 6644, 'loss/train': 1.9548885822296143} +11/06/2021 22:10:55 - INFO - __main__ - Step 6646: {'lr': 0.0004987857562095103, 'samples': 1276032, 'steps': 6645, 'loss/train': 1.8669013977050781} +11/06/2021 22:10:55 - INFO - __main__ - Step 6647: {'lr': 0.0004987852337595281, 'samples': 1276224, 'steps': 6646, 'loss/train': 1.6619402170181274} +11/06/2021 22:10:55 - INFO - __main__ - Step 6648: {'lr': 0.0004987847111974469, 'samples': 1276416, 'steps': 6647, 'loss/train': 1.4700028896331787} +11/06/2021 22:10:56 - INFO - __main__ - Step 6649: {'lr': 0.0004987841885232674, 'samples': 1276608, 'steps': 6648, 'loss/train': 1.8722918033599854} +11/06/2021 22:10:56 - INFO - __main__ - Step 6650: {'lr': 0.0004987836657369893, 'samples': 1276800, 'steps': 6649, 'loss/train': 2.425621271133423} +11/06/2021 22:10:57 - INFO - __main__ - Step 6651: {'lr': 0.0004987831428386133, 'samples': 1276992, 'steps': 6650, 'loss/train': 1.4940102100372314} +11/06/2021 22:10:58 - INFO - __main__ - Step 6652: {'lr': 0.0004987826198281394, 'samples': 1277184, 'steps': 6651, 'loss/train': 1.6286990642547607} +11/06/2021 22:10:58 - INFO - __main__ - Step 6653: {'lr': 0.0004987820967055678, 'samples': 1277376, 'steps': 6652, 'loss/train': 1.9754180908203125} +11/06/2021 22:10:58 - INFO - __main__ - Step 6654: {'lr': 0.000498781573470899, 'samples': 1277568, 'steps': 6653, 'loss/train': 2.209815502166748} +11/06/2021 22:10:59 - INFO - __main__ - Step 6655: {'lr': 0.000498781050124133, 'samples': 1277760, 'steps': 6654, 'loss/train': 2.132535934448242} +11/06/2021 22:11:00 - INFO - __main__ - Step 6656: {'lr': 0.0004987805266652701, 'samples': 1277952, 'steps': 6655, 'loss/train': 1.9133520126342773} +11/06/2021 22:11:00 - INFO - __main__ - Step 6657: {'lr': 0.0004987800030943105, 'samples': 1278144, 'steps': 6656, 'loss/train': 1.6376458406448364} +11/06/2021 22:11:00 - INFO - __main__ - Step 6658: {'lr': 0.0004987794794112545, 'samples': 1278336, 'steps': 6657, 'loss/train': 1.9937931299209595} +11/06/2021 22:11:01 - INFO - __main__ - Step 6659: {'lr': 0.0004987789556161022, 'samples': 1278528, 'steps': 6658, 'loss/train': 0.2782423198223114} +11/06/2021 22:11:01 - INFO - __main__ - Step 6660: {'lr': 0.0004987784317088541, 'samples': 1278720, 'steps': 6659, 'loss/train': 1.6906732320785522} +11/06/2021 22:11:02 - INFO - __main__ - Step 6661: {'lr': 0.0004987779076895102, 'samples': 1278912, 'steps': 6660, 'loss/train': 2.3083863258361816} +11/06/2021 22:11:03 - INFO - __main__ - Step 6662: {'lr': 0.0004987773835580708, 'samples': 1279104, 'steps': 6661, 'loss/train': 1.6070939302444458} +11/06/2021 22:11:03 - INFO - __main__ - Step 6663: {'lr': 0.0004987768593145362, 'samples': 1279296, 'steps': 6662, 'loss/train': 1.7183184623718262} +11/06/2021 22:11:03 - INFO - __main__ - Step 6664: {'lr': 0.0004987763349589065, 'samples': 1279488, 'steps': 6663, 'loss/train': 1.628963828086853} +11/06/2021 22:11:04 - INFO - __main__ - Step 6665: {'lr': 0.0004987758104911821, 'samples': 1279680, 'steps': 6664, 'loss/train': 1.9477825164794922} +11/06/2021 22:11:05 - INFO - __main__ - Step 6666: {'lr': 0.0004987752859113631, 'samples': 1279872, 'steps': 6665, 'loss/train': 1.3619539737701416} +11/06/2021 22:11:05 - INFO - __main__ - Step 6667: {'lr': 0.0004987747612194499, 'samples': 1280064, 'steps': 6666, 'loss/train': 1.2572715282440186} +11/06/2021 22:11:05 - INFO - __main__ - Step 6668: {'lr': 0.0004987742364154425, 'samples': 1280256, 'steps': 6667, 'loss/train': 2.365995407104492} +11/06/2021 22:11:06 - INFO - __main__ - Step 6669: {'lr': 0.0004987737114993413, 'samples': 1280448, 'steps': 6668, 'loss/train': 1.940123438835144} +11/06/2021 22:11:06 - INFO - __main__ - Step 6670: {'lr': 0.0004987731864711466, 'samples': 1280640, 'steps': 6669, 'loss/train': 1.1229156255722046} +11/06/2021 22:11:07 - INFO - __main__ - Step 6671: {'lr': 0.0004987726613308584, 'samples': 1280832, 'steps': 6670, 'loss/train': 1.7459203004837036} +11/06/2021 22:11:07 - INFO - __main__ - Step 6672: {'lr': 0.0004987721360784772, 'samples': 1281024, 'steps': 6671, 'loss/train': 1.6915955543518066} +11/06/2021 22:11:08 - INFO - __main__ - Step 6673: {'lr': 0.0004987716107140031, 'samples': 1281216, 'steps': 6672, 'loss/train': 2.0414986610412598} +11/06/2021 22:11:08 - INFO - __main__ - Step 6674: {'lr': 0.0004987710852374363, 'samples': 1281408, 'steps': 6673, 'loss/train': 2.4011054039001465} +11/06/2021 22:11:08 - INFO - __main__ - Step 6675: {'lr': 0.0004987705596487771, 'samples': 1281600, 'steps': 6674, 'loss/train': 1.3550761938095093} +11/06/2021 22:11:09 - INFO - __main__ - Step 6676: {'lr': 0.0004987700339480258, 'samples': 1281792, 'steps': 6675, 'loss/train': 1.6839749813079834} +11/06/2021 22:11:10 - INFO - __main__ - Step 6677: {'lr': 0.0004987695081351824, 'samples': 1281984, 'steps': 6676, 'loss/train': 2.2747011184692383} +11/06/2021 22:11:10 - INFO - __main__ - Step 6678: {'lr': 0.0004987689822102474, 'samples': 1282176, 'steps': 6677, 'loss/train': 1.934715747833252} +11/06/2021 22:11:10 - INFO - __main__ - Step 6679: {'lr': 0.000498768456173221, 'samples': 1282368, 'steps': 6678, 'loss/train': 1.7885398864746094} +11/06/2021 22:11:11 - INFO - __main__ - Step 6680: {'lr': 0.0004987679300241033, 'samples': 1282560, 'steps': 6679, 'loss/train': 1.533270239830017} +11/06/2021 22:11:11 - INFO - __main__ - Step 6681: {'lr': 0.0004987674037628945, 'samples': 1282752, 'steps': 6680, 'loss/train': 1.9293286800384521} +11/06/2021 22:11:12 - INFO - __main__ - Step 6682: {'lr': 0.0004987668773895951, 'samples': 1282944, 'steps': 6681, 'loss/train': 1.8046060800552368} +11/06/2021 22:11:13 - INFO - __main__ - Step 6683: {'lr': 0.0004987663509042052, 'samples': 1283136, 'steps': 6682, 'loss/train': 1.674709677696228} +11/06/2021 22:11:13 - INFO - __main__ - Step 6684: {'lr': 0.000498765824306725, 'samples': 1283328, 'steps': 6683, 'loss/train': 1.765952467918396} +11/06/2021 22:11:13 - INFO - __main__ - Step 6685: {'lr': 0.0004987652975971546, 'samples': 1283520, 'steps': 6684, 'loss/train': 2.027494192123413} +11/06/2021 22:11:14 - INFO - __main__ - Step 6686: {'lr': 0.0004987647707754945, 'samples': 1283712, 'steps': 6685, 'loss/train': 1.870924949645996} +11/06/2021 22:11:15 - INFO - __main__ - Step 6687: {'lr': 0.0004987642438417449, 'samples': 1283904, 'steps': 6686, 'loss/train': 1.476467490196228} +11/06/2021 22:11:15 - INFO - __main__ - Step 6688: {'lr': 0.0004987637167959059, 'samples': 1284096, 'steps': 6687, 'loss/train': 2.0917282104492188} +11/06/2021 22:11:15 - INFO - __main__ - Step 6689: {'lr': 0.0004987631896379779, 'samples': 1284288, 'steps': 6688, 'loss/train': 1.4638168811798096} +11/06/2021 22:11:16 - INFO - __main__ - Step 6690: {'lr': 0.0004987626623679609, 'samples': 1284480, 'steps': 6689, 'loss/train': 1.3137454986572266} +11/06/2021 22:11:16 - INFO - __main__ - Step 6691: {'lr': 0.0004987621349858553, 'samples': 1284672, 'steps': 6690, 'loss/train': 2.255805015563965} +11/06/2021 22:11:17 - INFO - __main__ - Step 6692: {'lr': 0.0004987616074916615, 'samples': 1284864, 'steps': 6691, 'loss/train': 1.9453632831573486} +11/06/2021 22:11:18 - INFO - __main__ - Step 6693: {'lr': 0.0004987610798853794, 'samples': 1285056, 'steps': 6692, 'loss/train': 1.9508827924728394} +11/06/2021 22:11:18 - INFO - __main__ - Step 6694: {'lr': 0.0004987605521670094, 'samples': 1285248, 'steps': 6693, 'loss/train': 1.6768591403961182} +11/06/2021 22:11:18 - INFO - __main__ - Step 6695: {'lr': 0.0004987600243365518, 'samples': 1285440, 'steps': 6694, 'loss/train': 1.7393834590911865} +11/06/2021 22:11:19 - INFO - __main__ - Step 6696: {'lr': 0.0004987594963940066, 'samples': 1285632, 'steps': 6695, 'loss/train': 1.7367832660675049} +11/06/2021 22:11:20 - INFO - __main__ - Step 6697: {'lr': 0.0004987589683393744, 'samples': 1285824, 'steps': 6696, 'loss/train': 2.0130209922790527} +11/06/2021 22:11:20 - INFO - __main__ - Step 6698: {'lr': 0.0004987584401726552, 'samples': 1286016, 'steps': 6697, 'loss/train': 2.1210427284240723} +11/06/2021 22:11:20 - INFO - __main__ - Step 6699: {'lr': 0.0004987579118938492, 'samples': 1286208, 'steps': 6698, 'loss/train': 1.9069485664367676} +11/06/2021 22:11:21 - INFO - __main__ - Step 6700: {'lr': 0.0004987573835029569, 'samples': 1286400, 'steps': 6699, 'loss/train': 2.1391384601593018} +11/06/2021 22:11:21 - INFO - __main__ - Step 6701: {'lr': 0.0004987568549999782, 'samples': 1286592, 'steps': 6700, 'loss/train': 1.8220481872558594} +11/06/2021 22:11:22 - INFO - __main__ - Step 6702: {'lr': 0.0004987563263849136, 'samples': 1286784, 'steps': 6701, 'loss/train': 2.194391965866089} +11/06/2021 22:11:22 - INFO - __main__ - Step 6703: {'lr': 0.0004987557976577632, 'samples': 1286976, 'steps': 6702, 'loss/train': 1.930019497871399} +11/06/2021 22:11:23 - INFO - __main__ - Step 6704: {'lr': 0.0004987552688185273, 'samples': 1287168, 'steps': 6703, 'loss/train': 2.2534563541412354} +11/06/2021 22:11:23 - INFO - __main__ - Step 6705: {'lr': 0.0004987547398672061, 'samples': 1287360, 'steps': 6704, 'loss/train': 1.8196769952774048} +11/06/2021 22:11:23 - INFO - __main__ - Step 6706: {'lr': 0.0004987542108037998, 'samples': 1287552, 'steps': 6705, 'loss/train': 2.2005743980407715} +11/06/2021 22:11:24 - INFO - __main__ - Step 6707: {'lr': 0.0004987536816283087, 'samples': 1287744, 'steps': 6706, 'loss/train': 1.494478702545166} +11/06/2021 22:11:25 - INFO - __main__ - Step 6708: {'lr': 0.0004987531523407331, 'samples': 1287936, 'steps': 6707, 'loss/train': 1.9010131359100342} +11/06/2021 22:11:25 - INFO - __main__ - Step 6709: {'lr': 0.0004987526229410732, 'samples': 1288128, 'steps': 6708, 'loss/train': 1.8058475255966187} +11/06/2021 22:11:25 - INFO - __main__ - Step 6710: {'lr': 0.000498752093429329, 'samples': 1288320, 'steps': 6709, 'loss/train': 1.8113231658935547} +11/06/2021 22:11:26 - INFO - __main__ - Step 6711: {'lr': 0.0004987515638055012, 'samples': 1288512, 'steps': 6710, 'loss/train': 1.8796414136886597} +11/06/2021 22:11:27 - INFO - __main__ - Step 6712: {'lr': 0.0004987510340695896, 'samples': 1288704, 'steps': 6711, 'loss/train': 2.1111533641815186} +11/06/2021 22:11:27 - INFO - __main__ - Step 6713: {'lr': 0.0004987505042215948, 'samples': 1288896, 'steps': 6712, 'loss/train': 2.0792810916900635} +11/06/2021 22:11:27 - INFO - __main__ - Step 6714: {'lr': 0.0004987499742615167, 'samples': 1289088, 'steps': 6713, 'loss/train': 1.8710038661956787} +11/06/2021 22:11:28 - INFO - __main__ - Step 6715: {'lr': 0.0004987494441893557, 'samples': 1289280, 'steps': 6714, 'loss/train': 2.19236421585083} +11/06/2021 22:11:28 - INFO - __main__ - Step 6716: {'lr': 0.0004987489140051121, 'samples': 1289472, 'steps': 6715, 'loss/train': 2.288778066635132} +11/06/2021 22:11:29 - INFO - __main__ - Step 6717: {'lr': 0.000498748383708786, 'samples': 1289664, 'steps': 6716, 'loss/train': 1.4987444877624512} +11/06/2021 22:11:30 - INFO - __main__ - Step 6718: {'lr': 0.0004987478533003779, 'samples': 1289856, 'steps': 6717, 'loss/train': 1.6623836755752563} +11/06/2021 22:11:30 - INFO - __main__ - Step 6719: {'lr': 0.0004987473227798877, 'samples': 1290048, 'steps': 6718, 'loss/train': 1.9826804399490356} +11/06/2021 22:11:30 - INFO - __main__ - Step 6720: {'lr': 0.0004987467921473157, 'samples': 1290240, 'steps': 6719, 'loss/train': 1.859378457069397} +11/06/2021 22:11:31 - INFO - __main__ - Step 6721: {'lr': 0.0004987462614026624, 'samples': 1290432, 'steps': 6720, 'loss/train': 1.4481638669967651} +11/06/2021 22:11:32 - INFO - __main__ - Step 6722: {'lr': 0.0004987457305459279, 'samples': 1290624, 'steps': 6721, 'loss/train': 1.673604965209961} +11/06/2021 22:11:32 - INFO - __main__ - Step 6723: {'lr': 0.0004987451995771124, 'samples': 1290816, 'steps': 6722, 'loss/train': 1.731692910194397} +11/06/2021 22:11:32 - INFO - __main__ - Step 6724: {'lr': 0.000498744668496216, 'samples': 1291008, 'steps': 6723, 'loss/train': 1.4091925621032715} +11/06/2021 22:11:33 - INFO - __main__ - Step 6725: {'lr': 0.0004987441373032393, 'samples': 1291200, 'steps': 6724, 'loss/train': 1.264276385307312} +11/06/2021 22:11:33 - INFO - __main__ - Step 6726: {'lr': 0.0004987436059981821, 'samples': 1291392, 'steps': 6725, 'loss/train': 1.7149850130081177} +11/06/2021 22:11:34 - INFO - __main__ - Step 6727: {'lr': 0.0004987430745810451, 'samples': 1291584, 'steps': 6726, 'loss/train': 1.8684431314468384} +11/06/2021 22:11:34 - INFO - __main__ - Step 6728: {'lr': 0.0004987425430518282, 'samples': 1291776, 'steps': 6727, 'loss/train': 1.2485170364379883} +11/06/2021 22:11:35 - INFO - __main__ - Step 6729: {'lr': 0.0004987420114105317, 'samples': 1291968, 'steps': 6728, 'loss/train': 1.7726978063583374} +11/06/2021 22:11:35 - INFO - __main__ - Step 6730: {'lr': 0.000498741479657156, 'samples': 1292160, 'steps': 6729, 'loss/train': 2.122650146484375} +11/06/2021 22:11:35 - INFO - __main__ - Step 6731: {'lr': 0.0004987409477917011, 'samples': 1292352, 'steps': 6730, 'loss/train': 2.2055673599243164} +11/06/2021 22:11:36 - INFO - __main__ - Step 6732: {'lr': 0.0004987404158141675, 'samples': 1292544, 'steps': 6731, 'loss/train': 1.7402311563491821} +11/06/2021 22:11:37 - INFO - __main__ - Step 6733: {'lr': 0.0004987398837245552, 'samples': 1292736, 'steps': 6732, 'loss/train': 2.053032159805298} +11/06/2021 22:11:37 - INFO - __main__ - Step 6734: {'lr': 0.0004987393515228646, 'samples': 1292928, 'steps': 6733, 'loss/train': 1.614290475845337} +11/06/2021 22:11:38 - INFO - __main__ - Step 6735: {'lr': 0.0004987388192090959, 'samples': 1293120, 'steps': 6734, 'loss/train': 1.5254181623458862} +11/06/2021 22:11:38 - INFO - __main__ - Step 6736: {'lr': 0.0004987382867832493, 'samples': 1293312, 'steps': 6735, 'loss/train': 2.606459379196167} +11/06/2021 22:11:38 - INFO - __main__ - Step 6737: {'lr': 0.0004987377542453251, 'samples': 1293504, 'steps': 6736, 'loss/train': 1.3655518293380737} +11/06/2021 22:11:39 - INFO - __main__ - Step 6738: {'lr': 0.0004987372215953234, 'samples': 1293696, 'steps': 6737, 'loss/train': 1.8274635076522827} +11/06/2021 22:11:40 - INFO - __main__ - Step 6739: {'lr': 0.0004987366888332446, 'samples': 1293888, 'steps': 6738, 'loss/train': 1.5153939723968506} +11/06/2021 22:11:40 - INFO - __main__ - Step 6740: {'lr': 0.0004987361559590889, 'samples': 1294080, 'steps': 6739, 'loss/train': 2.4495294094085693} +11/06/2021 22:11:40 - INFO - __main__ - Step 6741: {'lr': 0.0004987356229728566, 'samples': 1294272, 'steps': 6740, 'loss/train': 1.0965790748596191} +11/06/2021 22:11:41 - INFO - __main__ - Step 6742: {'lr': 0.0004987350898745477, 'samples': 1294464, 'steps': 6741, 'loss/train': 1.4959521293640137} +11/06/2021 22:11:42 - INFO - __main__ - Step 6743: {'lr': 0.0004987345566641628, 'samples': 1294656, 'steps': 6742, 'loss/train': 0.2513975501060486} +11/06/2021 22:11:42 - INFO - __main__ - Step 6744: {'lr': 0.0004987340233417019, 'samples': 1294848, 'steps': 6743, 'loss/train': 1.892668604850769} +11/06/2021 22:11:42 - INFO - __main__ - Step 6745: {'lr': 0.0004987334899071652, 'samples': 1295040, 'steps': 6744, 'loss/train': 3.132077217102051} +11/06/2021 22:11:43 - INFO - __main__ - Step 6746: {'lr': 0.000498732956360553, 'samples': 1295232, 'steps': 6745, 'loss/train': 2.2569050788879395} +11/06/2021 22:11:43 - INFO - __main__ - Step 6747: {'lr': 0.0004987324227018657, 'samples': 1295424, 'steps': 6746, 'loss/train': 2.1900782585144043} +11/06/2021 22:11:44 - INFO - __main__ - Step 6748: {'lr': 0.0004987318889311033, 'samples': 1295616, 'steps': 6747, 'loss/train': 2.0776844024658203} +11/06/2021 22:11:45 - INFO - __main__ - Step 6749: {'lr': 0.0004987313550482663, 'samples': 1295808, 'steps': 6748, 'loss/train': 2.524590253829956} +11/06/2021 22:11:45 - INFO - __main__ - Step 6750: {'lr': 0.0004987308210533546, 'samples': 1296000, 'steps': 6749, 'loss/train': 2.416774272918701} +11/06/2021 22:11:45 - INFO - __main__ - Step 6751: {'lr': 0.0004987302869463686, 'samples': 1296192, 'steps': 6750, 'loss/train': 1.5255533456802368} +11/06/2021 22:11:46 - INFO - __main__ - Step 6752: {'lr': 0.0004987297527273088, 'samples': 1296384, 'steps': 6751, 'loss/train': 1.5347144603729248} +11/06/2021 22:11:47 - INFO - __main__ - Step 6753: {'lr': 0.0004987292183961751, 'samples': 1296576, 'steps': 6752, 'loss/train': 1.8391497135162354} +11/06/2021 22:11:47 - INFO - __main__ - Step 6754: {'lr': 0.0004987286839529679, 'samples': 1296768, 'steps': 6753, 'loss/train': 1.9722280502319336} +11/06/2021 22:11:47 - INFO - __main__ - Step 6755: {'lr': 0.0004987281493976873, 'samples': 1296960, 'steps': 6754, 'loss/train': 1.6345213651657104} +11/06/2021 22:11:48 - INFO - __main__ - Step 6756: {'lr': 0.0004987276147303337, 'samples': 1297152, 'steps': 6755, 'loss/train': 1.5767613649368286} +11/06/2021 22:11:48 - INFO - __main__ - Step 6757: {'lr': 0.0004987270799509071, 'samples': 1297344, 'steps': 6756, 'loss/train': 1.8740566968917847} +11/06/2021 22:11:49 - INFO - __main__ - Step 6758: {'lr': 0.0004987265450594082, 'samples': 1297536, 'steps': 6757, 'loss/train': 1.6574358940124512} +11/06/2021 22:11:49 - INFO - __main__ - Step 6759: {'lr': 0.0004987260100558368, 'samples': 1297728, 'steps': 6758, 'loss/train': 2.1299595832824707} +11/06/2021 22:11:50 - INFO - __main__ - Step 6760: {'lr': 0.0004987254749401933, 'samples': 1297920, 'steps': 6759, 'loss/train': 1.5151968002319336} +11/06/2021 22:11:50 - INFO - __main__ - Step 6761: {'lr': 0.000498724939712478, 'samples': 1298112, 'steps': 6760, 'loss/train': 2.2985787391662598} +11/06/2021 22:11:51 - INFO - __main__ - Step 6762: {'lr': 0.000498724404372691, 'samples': 1298304, 'steps': 6761, 'loss/train': 2.6387453079223633} +11/06/2021 22:11:51 - INFO - __main__ - Step 6763: {'lr': 0.0004987238689208327, 'samples': 1298496, 'steps': 6762, 'loss/train': 1.8828072547912598} +11/06/2021 22:11:52 - INFO - __main__ - Step 6764: {'lr': 0.0004987233333569031, 'samples': 1298688, 'steps': 6763, 'loss/train': 2.250027894973755} +11/06/2021 22:11:52 - INFO - __main__ - Step 6765: {'lr': 0.0004987227976809028, 'samples': 1298880, 'steps': 6764, 'loss/train': 1.8417761325836182} +11/06/2021 22:11:53 - INFO - __main__ - Step 6766: {'lr': 0.0004987222618928318, 'samples': 1299072, 'steps': 6765, 'loss/train': 1.9207943677902222} +11/06/2021 22:11:53 - INFO - __main__ - Step 6767: {'lr': 0.0004987217259926904, 'samples': 1299264, 'steps': 6766, 'loss/train': 0.23178565502166748} +11/06/2021 22:11:53 - INFO - __main__ - Step 6768: {'lr': 0.0004987211899804788, 'samples': 1299456, 'steps': 6767, 'loss/train': 1.8414160013198853} +11/06/2021 22:11:55 - INFO - __main__ - Step 6769: {'lr': 0.0004987206538561972, 'samples': 1299648, 'steps': 6768, 'loss/train': 1.939680814743042} +11/06/2021 22:11:55 - INFO - __main__ - Step 6770: {'lr': 0.000498720117619846, 'samples': 1299840, 'steps': 6769, 'loss/train': 1.4610973596572876} +11/06/2021 22:11:55 - INFO - __main__ - Step 6771: {'lr': 0.0004987195812714252, 'samples': 1300032, 'steps': 6770, 'loss/train': 1.526523232460022} +11/06/2021 22:11:56 - INFO - __main__ - Step 6772: {'lr': 0.0004987190448109354, 'samples': 1300224, 'steps': 6771, 'loss/train': 2.2244198322296143} +11/06/2021 22:11:56 - INFO - __main__ - Step 6773: {'lr': 0.0004987185082383765, 'samples': 1300416, 'steps': 6772, 'loss/train': 1.7443127632141113} +11/06/2021 22:11:56 - INFO - __main__ - Step 6774: {'lr': 0.000498717971553749, 'samples': 1300608, 'steps': 6773, 'loss/train': 2.230355978012085} +11/06/2021 22:11:57 - INFO - __main__ - Step 6775: {'lr': 0.0004987174347570529, 'samples': 1300800, 'steps': 6774, 'loss/train': 0.42308324575424194} +11/06/2021 22:11:58 - INFO - __main__ - Step 6776: {'lr': 0.0004987168978482886, 'samples': 1300992, 'steps': 6775, 'loss/train': 1.6637697219848633} +11/06/2021 22:11:58 - INFO - __main__ - Step 6777: {'lr': 0.0004987163608274564, 'samples': 1301184, 'steps': 6776, 'loss/train': 1.6888412237167358} +11/06/2021 22:11:58 - INFO - __main__ - Step 6778: {'lr': 0.0004987158236945563, 'samples': 1301376, 'steps': 6777, 'loss/train': 1.6136714220046997} +11/06/2021 22:11:59 - INFO - __main__ - Step 6779: {'lr': 0.0004987152864495887, 'samples': 1301568, 'steps': 6778, 'loss/train': 2.1859946250915527} +11/06/2021 22:12:00 - INFO - __main__ - Step 6780: {'lr': 0.000498714749092554, 'samples': 1301760, 'steps': 6779, 'loss/train': 1.9430932998657227} +11/06/2021 22:12:00 - INFO - __main__ - Step 6781: {'lr': 0.0004987142116234521, 'samples': 1301952, 'steps': 6780, 'loss/train': 1.1831541061401367} +11/06/2021 22:12:00 - INFO - __main__ - Step 6782: {'lr': 0.0004987136740422835, 'samples': 1302144, 'steps': 6781, 'loss/train': 1.972415566444397} +11/06/2021 22:12:01 - INFO - __main__ - Step 6783: {'lr': 0.0004987131363490483, 'samples': 1302336, 'steps': 6782, 'loss/train': 1.6971096992492676} +11/06/2021 22:12:01 - INFO - __main__ - Step 6784: {'lr': 0.0004987125985437468, 'samples': 1302528, 'steps': 6783, 'loss/train': 2.15081524848938} +11/06/2021 22:12:02 - INFO - __main__ - Step 6785: {'lr': 0.0004987120606263794, 'samples': 1302720, 'steps': 6784, 'loss/train': 2.056392192840576} +11/06/2021 22:12:03 - INFO - __main__ - Step 6786: {'lr': 0.000498711522596946, 'samples': 1302912, 'steps': 6785, 'loss/train': 1.852485179901123} +11/06/2021 22:12:03 - INFO - __main__ - Step 6787: {'lr': 0.000498710984455447, 'samples': 1303104, 'steps': 6786, 'loss/train': 1.6676357984542847} +11/06/2021 22:12:03 - INFO - __main__ - Step 6788: {'lr': 0.0004987104462018828, 'samples': 1303296, 'steps': 6787, 'loss/train': 1.6238676309585571} +11/06/2021 22:12:04 - INFO - __main__ - Step 6789: {'lr': 0.0004987099078362534, 'samples': 1303488, 'steps': 6788, 'loss/train': 1.8077821731567383} +11/06/2021 22:12:05 - INFO - __main__ - Step 6790: {'lr': 0.0004987093693585591, 'samples': 1303680, 'steps': 6789, 'loss/train': 2.1676840782165527} +11/06/2021 22:12:05 - INFO - __main__ - Step 6791: {'lr': 0.0004987088307688004, 'samples': 1303872, 'steps': 6790, 'loss/train': 0.8062730431556702} +11/06/2021 22:12:05 - INFO - __main__ - Step 6792: {'lr': 0.0004987082920669772, 'samples': 1304064, 'steps': 6791, 'loss/train': 1.5815889835357666} +11/06/2021 22:12:06 - INFO - __main__ - Step 6793: {'lr': 0.0004987077532530899, 'samples': 1304256, 'steps': 6792, 'loss/train': 1.743523120880127} +11/06/2021 22:12:06 - INFO - __main__ - Step 6794: {'lr': 0.0004987072143271388, 'samples': 1304448, 'steps': 6793, 'loss/train': 1.1385010480880737} +11/06/2021 22:12:07 - INFO - __main__ - Step 6795: {'lr': 0.000498706675289124, 'samples': 1304640, 'steps': 6794, 'loss/train': 1.5993659496307373} +11/06/2021 22:12:07 - INFO - __main__ - Step 6796: {'lr': 0.0004987061361390458, 'samples': 1304832, 'steps': 6795, 'loss/train': 1.9786431789398193} +11/06/2021 22:12:08 - INFO - __main__ - Step 6797: {'lr': 0.0004987055968769045, 'samples': 1305024, 'steps': 6796, 'loss/train': 1.779247522354126} +11/06/2021 22:12:08 - INFO - __main__ - Step 6798: {'lr': 0.0004987050575027002, 'samples': 1305216, 'steps': 6797, 'loss/train': 1.8261228799819946} +11/06/2021 22:12:08 - INFO - __main__ - Step 6799: {'lr': 0.0004987045180164333, 'samples': 1305408, 'steps': 6798, 'loss/train': 1.5211654901504517} +11/06/2021 22:12:10 - INFO - __main__ - Step 6800: {'lr': 0.0004987039784181041, 'samples': 1305600, 'steps': 6799, 'loss/train': 0.9507125616073608} +11/06/2021 22:12:10 - INFO - __main__ - Step 6801: {'lr': 0.0004987034387077126, 'samples': 1305792, 'steps': 6800, 'loss/train': 1.7004783153533936} +11/06/2021 22:12:10 - INFO - __main__ - Step 6802: {'lr': 0.0004987028988852592, 'samples': 1305984, 'steps': 6801, 'loss/train': 2.2649049758911133} +11/06/2021 22:12:11 - INFO - __main__ - Step 6803: {'lr': 0.0004987023589507441, 'samples': 1306176, 'steps': 6802, 'loss/train': 1.9656171798706055} +11/06/2021 22:12:11 - INFO - __main__ - Step 6804: {'lr': 0.0004987018189041675, 'samples': 1306368, 'steps': 6803, 'loss/train': 1.7351499795913696} +11/06/2021 22:12:12 - INFO - __main__ - Step 6805: {'lr': 0.0004987012787455297, 'samples': 1306560, 'steps': 6804, 'loss/train': 1.2826176881790161} +11/06/2021 22:12:12 - INFO - __main__ - Step 6806: {'lr': 0.000498700738474831, 'samples': 1306752, 'steps': 6805, 'loss/train': 1.076385736465454} +11/06/2021 22:12:13 - INFO - __main__ - Step 6807: {'lr': 0.0004987001980920716, 'samples': 1306944, 'steps': 6806, 'loss/train': 1.8413560390472412} +11/06/2021 22:12:13 - INFO - __main__ - Step 6808: {'lr': 0.0004986996575972517, 'samples': 1307136, 'steps': 6807, 'loss/train': 0.7521131038665771} +11/06/2021 22:12:13 - INFO - __main__ - Step 6809: {'lr': 0.0004986991169903716, 'samples': 1307328, 'steps': 6808, 'loss/train': 2.316514015197754} +11/06/2021 22:12:14 - INFO - __main__ - Step 6810: {'lr': 0.0004986985762714314, 'samples': 1307520, 'steps': 6809, 'loss/train': 2.3181118965148926} +11/06/2021 22:12:15 - INFO - __main__ - Step 6811: {'lr': 0.0004986980354404316, 'samples': 1307712, 'steps': 6810, 'loss/train': 1.841756820678711} +11/06/2021 22:12:15 - INFO - __main__ - Step 6812: {'lr': 0.0004986974944973723, 'samples': 1307904, 'steps': 6811, 'loss/train': 2.5697433948516846} +11/06/2021 22:12:16 - INFO - __main__ - Step 6813: {'lr': 0.0004986969534422537, 'samples': 1308096, 'steps': 6812, 'loss/train': 0.27386459708213806} +11/06/2021 22:12:16 - INFO - __main__ - Step 6814: {'lr': 0.000498696412275076, 'samples': 1308288, 'steps': 6813, 'loss/train': 1.9443211555480957} +11/06/2021 22:12:16 - INFO - __main__ - Step 6815: {'lr': 0.0004986958709958396, 'samples': 1308480, 'steps': 6814, 'loss/train': 1.8300877809524536} +11/06/2021 22:12:18 - INFO - __main__ - Step 6816: {'lr': 0.0004986953296045448, 'samples': 1308672, 'steps': 6815, 'loss/train': 1.716494083404541} +11/06/2021 22:12:18 - INFO - __main__ - Step 6817: {'lr': 0.0004986947881011917, 'samples': 1308864, 'steps': 6816, 'loss/train': 1.5828531980514526} +11/06/2021 22:12:18 - INFO - __main__ - Step 6818: {'lr': 0.0004986942464857804, 'samples': 1309056, 'steps': 6817, 'loss/train': 1.8163785934448242} +11/06/2021 22:12:19 - INFO - __main__ - Step 6819: {'lr': 0.0004986937047583114, 'samples': 1309248, 'steps': 6818, 'loss/train': 1.8825898170471191} +11/06/2021 22:12:19 - INFO - __main__ - Step 6820: {'lr': 0.0004986931629187848, 'samples': 1309440, 'steps': 6819, 'loss/train': 2.2714736461639404} +11/06/2021 22:12:20 - INFO - __main__ - Step 6821: {'lr': 0.0004986926209672011, 'samples': 1309632, 'steps': 6820, 'loss/train': 2.2257802486419678} +11/06/2021 22:12:20 - INFO - __main__ - Step 6822: {'lr': 0.0004986920789035601, 'samples': 1309824, 'steps': 6821, 'loss/train': 1.6289818286895752} +11/06/2021 22:12:21 - INFO - __main__ - Step 6823: {'lr': 0.0004986915367278623, 'samples': 1310016, 'steps': 6822, 'loss/train': 1.8991657495498657} +11/06/2021 22:12:21 - INFO - __main__ - Step 6824: {'lr': 0.0004986909944401082, 'samples': 1310208, 'steps': 6823, 'loss/train': 1.4807871580123901} +11/06/2021 22:12:21 - INFO - __main__ - Step 6825: {'lr': 0.0004986904520402975, 'samples': 1310400, 'steps': 6824, 'loss/train': 1.9092999696731567} +11/06/2021 22:12:23 - INFO - __main__ - Step 6826: {'lr': 0.0004986899095284308, 'samples': 1310592, 'steps': 6825, 'loss/train': 2.1994271278381348} +11/06/2021 22:12:23 - INFO - __main__ - Step 6827: {'lr': 0.0004986893669045083, 'samples': 1310784, 'steps': 6826, 'loss/train': 2.3838884830474854} +11/06/2021 22:12:23 - INFO - __main__ - Step 6828: {'lr': 0.0004986888241685301, 'samples': 1310976, 'steps': 6827, 'loss/train': 1.6222882270812988} +11/06/2021 22:12:24 - INFO - __main__ - Step 6829: {'lr': 0.0004986882813204967, 'samples': 1311168, 'steps': 6828, 'loss/train': 2.6850411891937256} +11/06/2021 22:12:24 - INFO - __main__ - Step 6830: {'lr': 0.0004986877383604081, 'samples': 1311360, 'steps': 6829, 'loss/train': 1.8489203453063965} +11/06/2021 22:12:25 - INFO - __main__ - Step 6831: {'lr': 0.0004986871952882647, 'samples': 1311552, 'steps': 6830, 'loss/train': 1.933595061302185} +11/06/2021 22:12:25 - INFO - __main__ - Step 6832: {'lr': 0.0004986866521040666, 'samples': 1311744, 'steps': 6831, 'loss/train': 1.9676979780197144} +11/06/2021 22:12:26 - INFO - __main__ - Step 6833: {'lr': 0.0004986861088078142, 'samples': 1311936, 'steps': 6832, 'loss/train': 1.3297863006591797} +11/06/2021 22:12:26 - INFO - __main__ - Step 6834: {'lr': 0.0004986855653995077, 'samples': 1312128, 'steps': 6833, 'loss/train': 0.9145995378494263} +11/06/2021 22:12:26 - INFO - __main__ - Step 6835: {'lr': 0.0004986850218791474, 'samples': 1312320, 'steps': 6834, 'loss/train': 2.046581983566284} +11/06/2021 22:12:28 - INFO - __main__ - Step 6836: {'lr': 0.0004986844782467332, 'samples': 1312512, 'steps': 6835, 'loss/train': 1.6971626281738281} +11/06/2021 22:12:28 - INFO - __main__ - Step 6837: {'lr': 0.0004986839345022658, 'samples': 1312704, 'steps': 6836, 'loss/train': 1.80866539478302} +11/06/2021 22:12:29 - INFO - __main__ - Step 6838: {'lr': 0.0004986833906457453, 'samples': 1312896, 'steps': 6837, 'loss/train': 2.049255609512329} +11/06/2021 22:12:29 - INFO - __main__ - Step 6839: {'lr': 0.0004986828466771718, 'samples': 1313088, 'steps': 6838, 'loss/train': 2.1545591354370117} +11/06/2021 22:12:29 - INFO - __main__ - Step 6840: {'lr': 0.0004986823025965457, 'samples': 1313280, 'steps': 6839, 'loss/train': 1.8146533966064453} +11/06/2021 22:12:30 - INFO - __main__ - Step 6841: {'lr': 0.0004986817584038671, 'samples': 1313472, 'steps': 6840, 'loss/train': 1.6725200414657593} +11/06/2021 22:12:31 - INFO - __main__ - Step 6842: {'lr': 0.0004986812140991365, 'samples': 1313664, 'steps': 6841, 'loss/train': 2.010808229446411} +11/06/2021 22:12:31 - INFO - __main__ - Step 6843: {'lr': 0.0004986806696823538, 'samples': 1313856, 'steps': 6842, 'loss/train': 1.6977182626724243} +11/06/2021 22:12:31 - INFO - __main__ - Step 6844: {'lr': 0.0004986801251535195, 'samples': 1314048, 'steps': 6843, 'loss/train': 1.7137373685836792} +11/06/2021 22:12:32 - INFO - __main__ - Step 6845: {'lr': 0.0004986795805126339, 'samples': 1314240, 'steps': 6844, 'loss/train': 1.878450632095337} +11/06/2021 22:12:32 - INFO - __main__ - Step 6846: {'lr': 0.000498679035759697, 'samples': 1314432, 'steps': 6845, 'loss/train': 1.5944817066192627} +11/06/2021 22:12:33 - INFO - __main__ - Step 6847: {'lr': 0.0004986784908947091, 'samples': 1314624, 'steps': 6846, 'loss/train': 1.7078269720077515} +11/06/2021 22:12:34 - INFO - __main__ - Step 6848: {'lr': 0.0004986779459176706, 'samples': 1314816, 'steps': 6847, 'loss/train': 1.9563493728637695} +11/06/2021 22:12:34 - INFO - __main__ - Step 6849: {'lr': 0.0004986774008285816, 'samples': 1315008, 'steps': 6848, 'loss/train': 1.9744795560836792} +11/06/2021 22:12:34 - INFO - __main__ - Step 6850: {'lr': 0.0004986768556274425, 'samples': 1315200, 'steps': 6849, 'loss/train': 1.5663435459136963} +11/06/2021 22:12:35 - INFO - __main__ - Step 6851: {'lr': 0.0004986763103142533, 'samples': 1315392, 'steps': 6850, 'loss/train': 1.9012843370437622} +11/06/2021 22:12:36 - INFO - __main__ - Step 6852: {'lr': 0.0004986757648890145, 'samples': 1315584, 'steps': 6851, 'loss/train': 1.9131489992141724} +11/06/2021 22:12:36 - INFO - __main__ - Step 6853: {'lr': 0.0004986752193517262, 'samples': 1315776, 'steps': 6852, 'loss/train': 1.6437551975250244} +11/06/2021 22:12:36 - INFO - __main__ - Step 6854: {'lr': 0.0004986746737023887, 'samples': 1315968, 'steps': 6853, 'loss/train': 0.30247291922569275} +11/06/2021 22:12:37 - INFO - __main__ - Step 6855: {'lr': 0.0004986741279410023, 'samples': 1316160, 'steps': 6854, 'loss/train': 2.0035195350646973} +11/06/2021 22:12:37 - INFO - __main__ - Step 6856: {'lr': 0.000498673582067567, 'samples': 1316352, 'steps': 6855, 'loss/train': 1.685018539428711} +11/06/2021 22:12:38 - INFO - __main__ - Step 6857: {'lr': 0.0004986730360820833, 'samples': 1316544, 'steps': 6856, 'loss/train': 1.0697712898254395} +11/06/2021 22:12:39 - INFO - __main__ - Step 6858: {'lr': 0.0004986724899845514, 'samples': 1316736, 'steps': 6857, 'loss/train': 1.4516496658325195} +11/06/2021 22:12:39 - INFO - __main__ - Step 6859: {'lr': 0.0004986719437749716, 'samples': 1316928, 'steps': 6858, 'loss/train': 2.176100730895996} +11/06/2021 22:12:39 - INFO - __main__ - Step 6860: {'lr': 0.0004986713974533439, 'samples': 1317120, 'steps': 6859, 'loss/train': 1.1705691814422607} +11/06/2021 22:12:40 - INFO - __main__ - Step 6861: {'lr': 0.0004986708510196688, 'samples': 1317312, 'steps': 6860, 'loss/train': 1.852432131767273} +11/06/2021 22:12:40 - INFO - __main__ - Step 6862: {'lr': 0.0004986703044739464, 'samples': 1317504, 'steps': 6861, 'loss/train': 1.9012736082077026} +11/06/2021 22:12:41 - INFO - __main__ - Step 6863: {'lr': 0.000498669757816177, 'samples': 1317696, 'steps': 6862, 'loss/train': 2.041994333267212} +11/06/2021 22:12:41 - INFO - __main__ - Step 6864: {'lr': 0.0004986692110463609, 'samples': 1317888, 'steps': 6863, 'loss/train': 0.9249697327613831} +11/06/2021 22:12:42 - INFO - __main__ - Step 6865: {'lr': 0.0004986686641644982, 'samples': 1318080, 'steps': 6864, 'loss/train': 1.9790064096450806} +11/06/2021 22:12:42 - INFO - __main__ - Step 6866: {'lr': 0.0004986681171705893, 'samples': 1318272, 'steps': 6865, 'loss/train': 1.9213021993637085} +11/06/2021 22:12:42 - INFO - __main__ - Step 6867: {'lr': 0.0004986675700646343, 'samples': 1318464, 'steps': 6866, 'loss/train': 1.9628852605819702} +11/06/2021 22:12:43 - INFO - __main__ - Step 6868: {'lr': 0.0004986670228466337, 'samples': 1318656, 'steps': 6867, 'loss/train': 2.0977110862731934} +11/06/2021 22:12:44 - INFO - __main__ - Step 6869: {'lr': 0.0004986664755165874, 'samples': 1318848, 'steps': 6868, 'loss/train': 1.4509758949279785} +11/06/2021 22:12:44 - INFO - __main__ - Step 6870: {'lr': 0.000498665928074496, 'samples': 1319040, 'steps': 6869, 'loss/train': 1.9043452739715576} +11/06/2021 22:12:44 - INFO - __main__ - Step 6871: {'lr': 0.0004986653805203594, 'samples': 1319232, 'steps': 6870, 'loss/train': 1.188199520111084} +11/06/2021 22:12:45 - INFO - __main__ - Step 6872: {'lr': 0.0004986648328541781, 'samples': 1319424, 'steps': 6871, 'loss/train': 1.6279737949371338} +11/06/2021 22:12:46 - INFO - __main__ - Step 6873: {'lr': 0.0004986642850759522, 'samples': 1319616, 'steps': 6872, 'loss/train': 1.2891004085540771} +11/06/2021 22:12:46 - INFO - __main__ - Step 6874: {'lr': 0.0004986637371856822, 'samples': 1319808, 'steps': 6873, 'loss/train': 2.0982792377471924} +11/06/2021 22:12:47 - INFO - __main__ - Step 6875: {'lr': 0.000498663189183368, 'samples': 1320000, 'steps': 6874, 'loss/train': 1.6079758405685425} +11/06/2021 22:12:47 - INFO - __main__ - Step 6876: {'lr': 0.0004986626410690099, 'samples': 1320192, 'steps': 6875, 'loss/train': 1.3328086137771606} +11/06/2021 22:12:47 - INFO - __main__ - Step 6877: {'lr': 0.0004986620928426085, 'samples': 1320384, 'steps': 6876, 'loss/train': 1.9018620252609253} +11/06/2021 22:12:48 - INFO - __main__ - Step 6878: {'lr': 0.0004986615445041636, 'samples': 1320576, 'steps': 6877, 'loss/train': 1.5764297246932983} +11/06/2021 22:12:49 - INFO - __main__ - Step 6879: {'lr': 0.0004986609960536757, 'samples': 1320768, 'steps': 6878, 'loss/train': 1.831556797027588} +11/06/2021 22:12:49 - INFO - __main__ - Step 6880: {'lr': 0.000498660447491145, 'samples': 1320960, 'steps': 6879, 'loss/train': 1.3842569589614868} +11/06/2021 22:12:49 - INFO - __main__ - Step 6881: {'lr': 0.0004986598988165718, 'samples': 1321152, 'steps': 6880, 'loss/train': 2.5729262828826904} +11/06/2021 22:12:50 - INFO - __main__ - Step 6882: {'lr': 0.0004986593500299562, 'samples': 1321344, 'steps': 6881, 'loss/train': 2.3645272254943848} +11/06/2021 22:12:51 - INFO - __main__ - Step 6883: {'lr': 0.0004986588011312986, 'samples': 1321536, 'steps': 6882, 'loss/train': 1.524306058883667} +11/06/2021 22:12:51 - INFO - __main__ - Step 6884: {'lr': 0.0004986582521205992, 'samples': 1321728, 'steps': 6883, 'loss/train': 2.1317756175994873} +11/06/2021 22:12:51 - INFO - __main__ - Step 6885: {'lr': 0.0004986577029978581, 'samples': 1321920, 'steps': 6884, 'loss/train': 2.3129236698150635} +11/06/2021 22:12:52 - INFO - __main__ - Step 6886: {'lr': 0.0004986571537630757, 'samples': 1322112, 'steps': 6885, 'loss/train': 1.8439607620239258} +11/06/2021 22:12:52 - INFO - __main__ - Step 6887: {'lr': 0.0004986566044162523, 'samples': 1322304, 'steps': 6886, 'loss/train': 2.0930988788604736} +11/06/2021 22:12:53 - INFO - __main__ - Step 6888: {'lr': 0.0004986560549573881, 'samples': 1322496, 'steps': 6887, 'loss/train': 2.0430047512054443} +11/06/2021 22:12:53 - INFO - __main__ - Step 6889: {'lr': 0.0004986555053864833, 'samples': 1322688, 'steps': 6888, 'loss/train': 1.7372727394104004} +11/06/2021 22:12:54 - INFO - __main__ - Step 6890: {'lr': 0.0004986549557035381, 'samples': 1322880, 'steps': 6889, 'loss/train': 1.7419931888580322} +11/06/2021 22:12:54 - INFO - __main__ - Step 6891: {'lr': 0.0004986544059085528, 'samples': 1323072, 'steps': 6890, 'loss/train': 1.3079571723937988} +11/06/2021 22:12:55 - INFO - __main__ - Step 6892: {'lr': 0.0004986538560015277, 'samples': 1323264, 'steps': 6891, 'loss/train': 2.068556070327759} +11/06/2021 22:12:56 - INFO - __main__ - Step 6893: {'lr': 0.000498653305982463, 'samples': 1323456, 'steps': 6892, 'loss/train': 1.350880742073059} +11/06/2021 22:12:56 - INFO - __main__ - Step 6894: {'lr': 0.0004986527558513591, 'samples': 1323648, 'steps': 6893, 'loss/train': 1.4500173330307007} +11/06/2021 22:12:56 - INFO - __main__ - Step 6895: {'lr': 0.0004986522056082159, 'samples': 1323840, 'steps': 6894, 'loss/train': 2.146724224090576} +11/06/2021 22:12:57 - INFO - __main__ - Step 6896: {'lr': 0.0004986516552530339, 'samples': 1324032, 'steps': 6895, 'loss/train': 1.203369140625} +11/06/2021 22:12:57 - INFO - __main__ - Step 6897: {'lr': 0.0004986511047858134, 'samples': 1324224, 'steps': 6896, 'loss/train': 2.2133257389068604} +11/06/2021 22:12:57 - INFO - __main__ - Step 6898: {'lr': 0.0004986505542065545, 'samples': 1324416, 'steps': 6897, 'loss/train': 2.0129928588867188} +11/06/2021 22:12:58 - INFO - __main__ - Step 6899: {'lr': 0.0004986500035152574, 'samples': 1324608, 'steps': 6898, 'loss/train': 2.3049161434173584} +11/06/2021 22:12:59 - INFO - __main__ - Step 6900: {'lr': 0.0004986494527119226, 'samples': 1324800, 'steps': 6899, 'loss/train': 1.816585898399353} +11/06/2021 22:12:59 - INFO - __main__ - Step 6901: {'lr': 0.0004986489017965501, 'samples': 1324992, 'steps': 6900, 'loss/train': 1.263410210609436} +11/06/2021 22:12:59 - INFO - __main__ - Step 6902: {'lr': 0.0004986483507691403, 'samples': 1325184, 'steps': 6901, 'loss/train': 1.9309344291687012} +11/06/2021 22:13:00 - INFO - __main__ - Step 6903: {'lr': 0.0004986477996296934, 'samples': 1325376, 'steps': 6902, 'loss/train': 1.9613704681396484} +11/06/2021 22:13:01 - INFO - __main__ - Step 6904: {'lr': 0.0004986472483782096, 'samples': 1325568, 'steps': 6903, 'loss/train': 1.877648115158081} +11/06/2021 22:13:01 - INFO - __main__ - Step 6905: {'lr': 0.0004986466970146891, 'samples': 1325760, 'steps': 6904, 'loss/train': 1.900101900100708} +11/06/2021 22:13:01 - INFO - __main__ - Step 6906: {'lr': 0.0004986461455391323, 'samples': 1325952, 'steps': 6905, 'loss/train': 2.0257797241210938} +11/06/2021 22:13:02 - INFO - __main__ - Step 6907: {'lr': 0.0004986455939515395, 'samples': 1326144, 'steps': 6906, 'loss/train': 1.7874330282211304} +11/06/2021 22:13:02 - INFO - __main__ - Step 6908: {'lr': 0.0004986450422519107, 'samples': 1326336, 'steps': 6907, 'loss/train': 1.842711091041565} +11/06/2021 22:13:03 - INFO - __main__ - Step 6909: {'lr': 0.0004986444904402463, 'samples': 1326528, 'steps': 6908, 'loss/train': 2.1983108520507812} +11/06/2021 22:13:03 - INFO - __main__ - Step 6910: {'lr': 0.0004986439385165464, 'samples': 1326720, 'steps': 6909, 'loss/train': 1.821173906326294} +11/06/2021 22:13:04 - INFO - __main__ - Step 6911: {'lr': 0.0004986433864808115, 'samples': 1326912, 'steps': 6910, 'loss/train': 2.3128411769866943} +11/06/2021 22:13:04 - INFO - __main__ - Step 6912: {'lr': 0.0004986428343330418, 'samples': 1327104, 'steps': 6911, 'loss/train': 1.7972272634506226} +11/06/2021 22:13:05 - INFO - __main__ - Step 6913: {'lr': 0.0004986422820732375, 'samples': 1327296, 'steps': 6912, 'loss/train': 2.888493776321411} +11/06/2021 22:13:05 - INFO - __main__ - Step 6914: {'lr': 0.0004986417297013987, 'samples': 1327488, 'steps': 6913, 'loss/train': 1.6202863454818726} +11/06/2021 22:13:06 - INFO - __main__ - Step 6915: {'lr': 0.0004986411772175258, 'samples': 1327680, 'steps': 6914, 'loss/train': 1.704667329788208} +11/06/2021 22:13:06 - INFO - __main__ - Step 6916: {'lr': 0.000498640624621619, 'samples': 1327872, 'steps': 6915, 'loss/train': 1.571314811706543} +11/06/2021 22:13:07 - INFO - __main__ - Step 6917: {'lr': 0.0004986400719136786, 'samples': 1328064, 'steps': 6916, 'loss/train': 1.8842869997024536} +11/06/2021 22:13:07 - INFO - __main__ - Step 6918: {'lr': 0.0004986395190937048, 'samples': 1328256, 'steps': 6917, 'loss/train': 1.7865066528320312} +11/06/2021 22:13:08 - INFO - __main__ - Step 6919: {'lr': 0.000498638966161698, 'samples': 1328448, 'steps': 6918, 'loss/train': 1.9803627729415894} +11/06/2021 22:13:08 - INFO - __main__ - Step 6920: {'lr': 0.0004986384131176583, 'samples': 1328640, 'steps': 6919, 'loss/train': 2.02374529838562} +11/06/2021 22:13:09 - INFO - __main__ - Step 6921: {'lr': 0.0004986378599615858, 'samples': 1328832, 'steps': 6920, 'loss/train': 2.2463250160217285} +11/06/2021 22:13:09 - INFO - __main__ - Step 6922: {'lr': 0.000498637306693481, 'samples': 1329024, 'steps': 6921, 'loss/train': 1.9036977291107178} +11/06/2021 22:13:09 - INFO - __main__ - Step 6923: {'lr': 0.0004986367533133441, 'samples': 1329216, 'steps': 6922, 'loss/train': 1.8560709953308105} +11/06/2021 22:13:10 - INFO - __main__ - Step 6924: {'lr': 0.0004986361998211752, 'samples': 1329408, 'steps': 6923, 'loss/train': 1.860509991645813} +11/06/2021 22:13:11 - INFO - __main__ - Step 6925: {'lr': 0.0004986356462169748, 'samples': 1329600, 'steps': 6924, 'loss/train': 1.627434253692627} +11/06/2021 22:13:11 - INFO - __main__ - Step 6926: {'lr': 0.0004986350925007429, 'samples': 1329792, 'steps': 6925, 'loss/train': 1.9676358699798584} +11/06/2021 22:13:11 - INFO - __main__ - Step 6927: {'lr': 0.00049863453867248, 'samples': 1329984, 'steps': 6926, 'loss/train': 1.5846327543258667} +11/06/2021 22:13:12 - INFO - __main__ - Step 6928: {'lr': 0.0004986339847321862, 'samples': 1330176, 'steps': 6927, 'loss/train': 2.3178396224975586} +11/06/2021 22:13:13 - INFO - __main__ - Step 6929: {'lr': 0.0004986334306798616, 'samples': 1330368, 'steps': 6928, 'loss/train': 2.166189432144165} +11/06/2021 22:13:13 - INFO - __main__ - Step 6930: {'lr': 0.0004986328765155068, 'samples': 1330560, 'steps': 6929, 'loss/train': 2.235844373703003} +11/06/2021 22:13:13 - INFO - __main__ - Step 6931: {'lr': 0.0004986323222391217, 'samples': 1330752, 'steps': 6930, 'loss/train': 1.5991435050964355} +11/06/2021 22:13:14 - INFO - __main__ - Step 6932: {'lr': 0.0004986317678507069, 'samples': 1330944, 'steps': 6931, 'loss/train': 1.773486852645874} +11/06/2021 22:13:14 - INFO - __main__ - Step 6933: {'lr': 0.0004986312133502623, 'samples': 1331136, 'steps': 6932, 'loss/train': 0.26625779271125793} +11/06/2021 22:13:15 - INFO - __main__ - Step 6934: {'lr': 0.0004986306587377884, 'samples': 1331328, 'steps': 6933, 'loss/train': 1.767874836921692} +11/06/2021 22:13:16 - INFO - __main__ - Step 6935: {'lr': 0.0004986301040132853, 'samples': 1331520, 'steps': 6934, 'loss/train': 1.564034342765808} +11/06/2021 22:13:16 - INFO - __main__ - Step 6936: {'lr': 0.0004986295491767533, 'samples': 1331712, 'steps': 6935, 'loss/train': 1.7570186853408813} +11/06/2021 22:13:16 - INFO - __main__ - Step 6937: {'lr': 0.0004986289942281927, 'samples': 1331904, 'steps': 6936, 'loss/train': 1.7670789957046509} +11/06/2021 22:13:17 - INFO - __main__ - Step 6938: {'lr': 0.0004986284391676037, 'samples': 1332096, 'steps': 6937, 'loss/train': 2.3007538318634033} +11/06/2021 22:13:18 - INFO - __main__ - Step 6939: {'lr': 0.0004986278839949866, 'samples': 1332288, 'steps': 6938, 'loss/train': 2.0607035160064697} +11/06/2021 22:13:18 - INFO - __main__ - Step 6940: {'lr': 0.0004986273287103416, 'samples': 1332480, 'steps': 6939, 'loss/train': 2.072021484375} +11/06/2021 22:13:18 - INFO - __main__ - Step 6941: {'lr': 0.0004986267733136689, 'samples': 1332672, 'steps': 6940, 'loss/train': 1.5899384021759033} +11/06/2021 22:13:19 - INFO - __main__ - Step 6942: {'lr': 0.0004986262178049689, 'samples': 1332864, 'steps': 6941, 'loss/train': 2.349639415740967} +11/06/2021 22:13:19 - INFO - __main__ - Step 6943: {'lr': 0.0004986256621842417, 'samples': 1333056, 'steps': 6942, 'loss/train': 1.3075493574142456} +11/06/2021 22:13:20 - INFO - __main__ - Step 6944: {'lr': 0.0004986251064514878, 'samples': 1333248, 'steps': 6943, 'loss/train': 1.4353903532028198} +11/06/2021 22:13:21 - INFO - __main__ - Step 6945: {'lr': 0.000498624550606707, 'samples': 1333440, 'steps': 6944, 'loss/train': 2.1542229652404785} +11/06/2021 22:13:21 - INFO - __main__ - Step 6946: {'lr': 0.0004986239946498999, 'samples': 1333632, 'steps': 6945, 'loss/train': 1.9125726222991943} +11/06/2021 22:13:21 - INFO - __main__ - Step 6947: {'lr': 0.0004986234385810668, 'samples': 1333824, 'steps': 6946, 'loss/train': 1.9208937883377075} +11/06/2021 22:13:22 - INFO - __main__ - Step 6948: {'lr': 0.0004986228824002076, 'samples': 1334016, 'steps': 6947, 'loss/train': 1.7958143949508667} +11/06/2021 22:13:23 - INFO - __main__ - Step 6949: {'lr': 0.0004986223261073228, 'samples': 1334208, 'steps': 6948, 'loss/train': 2.022138833999634} +11/06/2021 22:13:23 - INFO - __main__ - Step 6950: {'lr': 0.0004986217697024128, 'samples': 1334400, 'steps': 6949, 'loss/train': 2.049771785736084} +11/06/2021 22:13:23 - INFO - __main__ - Step 6951: {'lr': 0.0004986212131854775, 'samples': 1334592, 'steps': 6950, 'loss/train': 1.7569395303726196} +11/06/2021 22:13:24 - INFO - __main__ - Step 6952: {'lr': 0.0004986206565565173, 'samples': 1334784, 'steps': 6951, 'loss/train': 1.6181141138076782} +11/06/2021 22:13:24 - INFO - __main__ - Step 6953: {'lr': 0.0004986200998155325, 'samples': 1334976, 'steps': 6952, 'loss/train': 2.3144214153289795} +11/06/2021 22:13:24 - INFO - __main__ - Step 6954: {'lr': 0.0004986195429625234, 'samples': 1335168, 'steps': 6953, 'loss/train': 1.8186416625976562} +11/06/2021 22:13:25 - INFO - __main__ - Step 6955: {'lr': 0.0004986189859974901, 'samples': 1335360, 'steps': 6954, 'loss/train': 1.4414639472961426} +11/06/2021 22:13:26 - INFO - __main__ - Step 6956: {'lr': 0.000498618428920433, 'samples': 1335552, 'steps': 6955, 'loss/train': 1.4519563913345337} +11/06/2021 22:13:26 - INFO - __main__ - Step 6957: {'lr': 0.0004986178717313522, 'samples': 1335744, 'steps': 6956, 'loss/train': 1.7825121879577637} +11/06/2021 22:13:26 - INFO - __main__ - Step 6958: {'lr': 0.000498617314430248, 'samples': 1335936, 'steps': 6957, 'loss/train': 2.2233121395111084} +11/06/2021 22:13:27 - INFO - __main__ - Step 6959: {'lr': 0.0004986167570171208, 'samples': 1336128, 'steps': 6958, 'loss/train': 2.0718345642089844} +11/06/2021 22:13:28 - INFO - __main__ - Step 6960: {'lr': 0.0004986161994919706, 'samples': 1336320, 'steps': 6959, 'loss/train': 1.547726035118103} +11/06/2021 22:13:28 - INFO - __main__ - Step 6961: {'lr': 0.0004986156418547978, 'samples': 1336512, 'steps': 6960, 'loss/train': 2.062274694442749} +11/06/2021 22:13:29 - INFO - __main__ - Step 6962: {'lr': 0.0004986150841056027, 'samples': 1336704, 'steps': 6961, 'loss/train': 2.067039966583252} +11/06/2021 22:13:29 - INFO - __main__ - Step 6963: {'lr': 0.0004986145262443854, 'samples': 1336896, 'steps': 6962, 'loss/train': 1.8536887168884277} +11/06/2021 22:13:29 - INFO - __main__ - Step 6964: {'lr': 0.0004986139682711463, 'samples': 1337088, 'steps': 6963, 'loss/train': 2.060143232345581} +11/06/2021 22:13:31 - INFO - __main__ - Step 6965: {'lr': 0.0004986134101858854, 'samples': 1337280, 'steps': 6964, 'loss/train': 1.9564449787139893} +11/06/2021 22:13:31 - INFO - __main__ - Step 6966: {'lr': 0.0004986128519886033, 'samples': 1337472, 'steps': 6965, 'loss/train': 2.0002098083496094} +11/06/2021 22:13:31 - INFO - __main__ - Step 6967: {'lr': 0.0004986122936793, 'samples': 1337664, 'steps': 6966, 'loss/train': 1.0394262075424194} +11/06/2021 22:13:32 - INFO - __main__ - Step 6968: {'lr': 0.000498611735257976, 'samples': 1337856, 'steps': 6967, 'loss/train': 1.8004080057144165} +11/06/2021 22:13:32 - INFO - __main__ - Step 6969: {'lr': 0.0004986111767246313, 'samples': 1338048, 'steps': 6968, 'loss/train': 1.8207870721817017} +11/06/2021 22:13:33 - INFO - __main__ - Step 6970: {'lr': 0.0004986106180792662, 'samples': 1338240, 'steps': 6969, 'loss/train': 2.2126078605651855} +11/06/2021 22:13:33 - INFO - __main__ - Step 6971: {'lr': 0.000498610059321881, 'samples': 1338432, 'steps': 6970, 'loss/train': 1.8455476760864258} +11/06/2021 22:13:34 - INFO - __main__ - Step 6972: {'lr': 0.000498609500452476, 'samples': 1338624, 'steps': 6971, 'loss/train': 1.8543205261230469} +11/06/2021 22:13:34 - INFO - __main__ - Step 6973: {'lr': 0.0004986089414710513, 'samples': 1338816, 'steps': 6972, 'loss/train': 2.0430335998535156} +11/06/2021 22:13:35 - INFO - __main__ - Step 6974: {'lr': 0.0004986083823776073, 'samples': 1339008, 'steps': 6973, 'loss/train': 1.9079920053482056} +11/06/2021 22:13:35 - INFO - __main__ - Step 6975: {'lr': 0.0004986078231721443, 'samples': 1339200, 'steps': 6974, 'loss/train': 0.6376028060913086} +11/06/2021 22:13:36 - INFO - __main__ - Step 6976: {'lr': 0.0004986072638546623, 'samples': 1339392, 'steps': 6975, 'loss/train': 1.7745708227157593} +11/06/2021 22:13:36 - INFO - __main__ - Step 6977: {'lr': 0.0004986067044251617, 'samples': 1339584, 'steps': 6976, 'loss/train': 2.010833740234375} +11/06/2021 22:13:37 - INFO - __main__ - Step 6978: {'lr': 0.0004986061448836428, 'samples': 1339776, 'steps': 6977, 'loss/train': 1.629277229309082} +11/06/2021 22:13:37 - INFO - __main__ - Step 6979: {'lr': 0.0004986055852301058, 'samples': 1339968, 'steps': 6978, 'loss/train': 1.9664230346679688} +11/06/2021 22:13:39 - INFO - __main__ - Step 6980: {'lr': 0.000498605025464551, 'samples': 1340160, 'steps': 6979, 'loss/train': 1.915958046913147} +11/06/2021 22:13:39 - INFO - __main__ - Step 6981: {'lr': 0.0004986044655869786, 'samples': 1340352, 'steps': 6980, 'loss/train': 1.7974884510040283} +11/06/2021 22:13:40 - INFO - __main__ - Step 6982: {'lr': 0.0004986039055973889, 'samples': 1340544, 'steps': 6981, 'loss/train': 1.9128649234771729} +11/06/2021 22:13:40 - INFO - __main__ - Step 6983: {'lr': 0.000498603345495782, 'samples': 1340736, 'steps': 6982, 'loss/train': 1.8619794845581055} +11/06/2021 22:13:40 - INFO - __main__ - Step 6984: {'lr': 0.0004986027852821583, 'samples': 1340928, 'steps': 6983, 'loss/train': 1.3572192192077637} +11/06/2021 22:13:41 - INFO - __main__ - Step 6985: {'lr': 0.000498602224956518, 'samples': 1341120, 'steps': 6984, 'loss/train': 1.4499187469482422} +11/06/2021 22:13:41 - INFO - __main__ - Step 6986: {'lr': 0.0004986016645188615, 'samples': 1341312, 'steps': 6985, 'loss/train': 1.4657028913497925} +11/06/2021 22:13:41 - INFO - __main__ - Step 6987: {'lr': 0.0004986011039691889, 'samples': 1341504, 'steps': 6986, 'loss/train': 2.016274929046631} +11/06/2021 22:13:43 - INFO - __main__ - Step 6988: {'lr': 0.0004986005433075004, 'samples': 1341696, 'steps': 6987, 'loss/train': 2.058478355407715} +11/06/2021 22:13:43 - INFO - __main__ - Step 6989: {'lr': 0.0004985999825337964, 'samples': 1341888, 'steps': 6988, 'loss/train': 2.3388593196868896} +11/06/2021 22:13:43 - INFO - __main__ - Step 6990: {'lr': 0.000498599421648077, 'samples': 1342080, 'steps': 6989, 'loss/train': 1.34577214717865} +11/06/2021 22:13:44 - INFO - __main__ - Step 6991: {'lr': 0.0004985988606503426, 'samples': 1342272, 'steps': 6990, 'loss/train': 1.556723713874817} +11/06/2021 22:13:44 - INFO - __main__ - Step 6992: {'lr': 0.0004985982995405933, 'samples': 1342464, 'steps': 6991, 'loss/train': 1.9663342237472534} +11/06/2021 22:13:45 - INFO - __main__ - Step 6993: {'lr': 0.0004985977383188296, 'samples': 1342656, 'steps': 6992, 'loss/train': 1.9654285907745361} +11/06/2021 22:13:45 - INFO - __main__ - Step 6994: {'lr': 0.0004985971769850515, 'samples': 1342848, 'steps': 6993, 'loss/train': 1.9241557121276855} +11/06/2021 22:13:46 - INFO - __main__ - Step 6995: {'lr': 0.0004985966155392593, 'samples': 1343040, 'steps': 6994, 'loss/train': 2.185478687286377} +11/06/2021 22:13:46 - INFO - __main__ - Step 6996: {'lr': 0.0004985960539814534, 'samples': 1343232, 'steps': 6995, 'loss/train': 1.901774287223816} +11/06/2021 22:13:46 - INFO - __main__ - Step 6997: {'lr': 0.000498595492311634, 'samples': 1343424, 'steps': 6996, 'loss/train': 1.8927873373031616} +11/06/2021 22:13:47 - INFO - __main__ - Step 6998: {'lr': 0.0004985949305298012, 'samples': 1343616, 'steps': 6997, 'loss/train': 1.5036976337432861} +11/06/2021 22:13:48 - INFO - __main__ - Step 6999: {'lr': 0.0004985943686359554, 'samples': 1343808, 'steps': 6998, 'loss/train': 2.1838197708129883} +11/06/2021 22:13:48 - INFO - __main__ - Step 7000: {'lr': 0.0004985938066300968, 'samples': 1344000, 'steps': 6999, 'loss/train': 1.8023282289505005} +11/06/2021 22:13:48 - INFO - __main__ - Step 7001: {'lr': 0.0004985932445122257, 'samples': 1344192, 'steps': 7000, 'loss/train': 0.9377233982086182} +11/06/2021 22:13:49 - INFO - __main__ - Step 7002: {'lr': 0.0004985926822823422, 'samples': 1344384, 'steps': 7001, 'loss/train': 2.0790352821350098} +11/06/2021 22:13:49 - INFO - __main__ - Step 7003: {'lr': 0.0004985921199404467, 'samples': 1344576, 'steps': 7002, 'loss/train': 1.5738434791564941} +11/06/2021 22:13:50 - INFO - __main__ - Step 7004: {'lr': 0.0004985915574865395, 'samples': 1344768, 'steps': 7003, 'loss/train': 2.0488102436065674} +11/06/2021 22:13:50 - INFO - __main__ - Step 7005: {'lr': 0.0004985909949206209, 'samples': 1344960, 'steps': 7004, 'loss/train': 2.2131500244140625} +11/06/2021 22:13:51 - INFO - __main__ - Step 7006: {'lr': 0.0004985904322426909, 'samples': 1345152, 'steps': 7005, 'loss/train': 2.16741681098938} +11/06/2021 22:13:51 - INFO - __main__ - Step 7007: {'lr': 0.0004985898694527498, 'samples': 1345344, 'steps': 7006, 'loss/train': 1.9892717599868774} +11/06/2021 22:13:52 - INFO - __main__ - Step 7008: {'lr': 0.000498589306550798, 'samples': 1345536, 'steps': 7007, 'loss/train': 1.8207341432571411} +11/06/2021 22:13:53 - INFO - __main__ - Step 7009: {'lr': 0.0004985887435368357, 'samples': 1345728, 'steps': 7008, 'loss/train': 2.600703716278076} +11/06/2021 22:13:53 - INFO - __main__ - Step 7010: {'lr': 0.0004985881804108632, 'samples': 1345920, 'steps': 7009, 'loss/train': 1.830875277519226} +11/06/2021 22:13:53 - INFO - __main__ - Step 7011: {'lr': 0.0004985876171728807, 'samples': 1346112, 'steps': 7010, 'loss/train': 1.6429589986801147} +11/06/2021 22:13:54 - INFO - __main__ - Step 7012: {'lr': 0.0004985870538228884, 'samples': 1346304, 'steps': 7011, 'loss/train': 1.831001877784729} +11/06/2021 22:13:54 - INFO - __main__ - Step 7013: {'lr': 0.0004985864903608866, 'samples': 1346496, 'steps': 7012, 'loss/train': 1.9762578010559082} +11/06/2021 22:13:55 - INFO - __main__ - Step 7014: {'lr': 0.0004985859267868756, 'samples': 1346688, 'steps': 7013, 'loss/train': 2.1162519454956055} +11/06/2021 22:13:55 - INFO - __main__ - Step 7015: {'lr': 0.0004985853631008557, 'samples': 1346880, 'steps': 7014, 'loss/train': 1.9965474605560303} +11/06/2021 22:13:56 - INFO - __main__ - Step 7016: {'lr': 0.000498584799302827, 'samples': 1347072, 'steps': 7015, 'loss/train': 1.330285906791687} +11/06/2021 22:13:56 - INFO - __main__ - Step 7017: {'lr': 0.0004985842353927897, 'samples': 1347264, 'steps': 7016, 'loss/train': 1.870910406112671} +11/06/2021 22:13:57 - INFO - __main__ - Step 7018: {'lr': 0.0004985836713707443, 'samples': 1347456, 'steps': 7017, 'loss/train': 2.007260799407959} +11/06/2021 22:13:58 - INFO - __main__ - Step 7019: {'lr': 0.000498583107236691, 'samples': 1347648, 'steps': 7018, 'loss/train': 1.9178532361984253} +11/06/2021 22:13:58 - INFO - __main__ - Step 7020: {'lr': 0.0004985825429906299, 'samples': 1347840, 'steps': 7019, 'loss/train': 1.8477237224578857} +11/06/2021 22:13:58 - INFO - __main__ - Step 7021: {'lr': 0.0004985819786325614, 'samples': 1348032, 'steps': 7020, 'loss/train': 1.7012065649032593} +11/06/2021 22:13:59 - INFO - __main__ - Step 7022: {'lr': 0.0004985814141624856, 'samples': 1348224, 'steps': 7021, 'loss/train': 1.9966686964035034} +11/06/2021 22:13:59 - INFO - __main__ - Step 7023: {'lr': 0.000498580849580403, 'samples': 1348416, 'steps': 7022, 'loss/train': 1.7305803298950195} +11/06/2021 22:13:59 - INFO - __main__ - Step 7024: {'lr': 0.0004985802848863135, 'samples': 1348608, 'steps': 7023, 'loss/train': 2.0270166397094727} +11/06/2021 22:14:00 - INFO - __main__ - Step 7025: {'lr': 0.0004985797200802176, 'samples': 1348800, 'steps': 7024, 'loss/train': 2.123034715652466} +11/06/2021 22:14:01 - INFO - __main__ - Step 7026: {'lr': 0.0004985791551621158, 'samples': 1348992, 'steps': 7025, 'loss/train': 1.589381456375122} +11/06/2021 22:14:01 - INFO - __main__ - Step 7027: {'lr': 0.0004985785901320078, 'samples': 1349184, 'steps': 7026, 'loss/train': 1.8792399168014526} +11/06/2021 22:14:02 - INFO - __main__ - Step 7028: {'lr': 0.0004985780249898941, 'samples': 1349376, 'steps': 7027, 'loss/train': 1.8955899477005005} +11/06/2021 22:14:02 - INFO - __main__ - Step 7029: {'lr': 0.0004985774597357751, 'samples': 1349568, 'steps': 7028, 'loss/train': 2.0755574703216553} +11/06/2021 22:14:03 - INFO - __main__ - Step 7030: {'lr': 0.0004985768943696509, 'samples': 1349760, 'steps': 7029, 'loss/train': 1.896838903427124} +11/06/2021 22:14:03 - INFO - __main__ - Step 7031: {'lr': 0.0004985763288915217, 'samples': 1349952, 'steps': 7030, 'loss/train': 2.0868396759033203} +11/06/2021 22:14:04 - INFO - __main__ - Step 7032: {'lr': 0.0004985757633013879, 'samples': 1350144, 'steps': 7031, 'loss/train': 1.9611470699310303} +11/06/2021 22:14:04 - INFO - __main__ - Step 7033: {'lr': 0.0004985751975992497, 'samples': 1350336, 'steps': 7032, 'loss/train': 2.039046287536621} +11/06/2021 22:14:04 - INFO - __main__ - Step 7034: {'lr': 0.0004985746317851074, 'samples': 1350528, 'steps': 7033, 'loss/train': 2.1592774391174316} +11/06/2021 22:14:05 - INFO - __main__ - Step 7035: {'lr': 0.0004985740658589612, 'samples': 1350720, 'steps': 7034, 'loss/train': 1.7554975748062134} +11/06/2021 22:14:06 - INFO - __main__ - Step 7036: {'lr': 0.0004985734998208112, 'samples': 1350912, 'steps': 7035, 'loss/train': 1.64145028591156} +11/06/2021 22:14:06 - INFO - __main__ - Step 7037: {'lr': 0.000498572933670658, 'samples': 1351104, 'steps': 7036, 'loss/train': 1.8642250299453735} +11/06/2021 22:14:06 - INFO - __main__ - Step 7038: {'lr': 0.0004985723674085016, 'samples': 1351296, 'steps': 7037, 'loss/train': 1.789941430091858} +11/06/2021 22:14:07 - INFO - __main__ - Step 7039: {'lr': 0.0004985718010343424, 'samples': 1351488, 'steps': 7038, 'loss/train': 2.0578839778900146} +11/06/2021 22:14:08 - INFO - __main__ - Step 7040: {'lr': 0.0004985712345481805, 'samples': 1351680, 'steps': 7039, 'loss/train': 1.8973031044006348} +11/06/2021 22:14:08 - INFO - __main__ - Step 7041: {'lr': 0.0004985706679500163, 'samples': 1351872, 'steps': 7040, 'loss/train': 2.2261483669281006} +11/06/2021 22:14:08 - INFO - __main__ - Step 7042: {'lr': 0.0004985701012398499, 'samples': 1352064, 'steps': 7041, 'loss/train': 2.026362657546997} +11/06/2021 22:14:09 - INFO - __main__ - Step 7043: {'lr': 0.0004985695344176817, 'samples': 1352256, 'steps': 7042, 'loss/train': 2.370086669921875} +11/06/2021 22:14:09 - INFO - __main__ - Step 7044: {'lr': 0.0004985689674835119, 'samples': 1352448, 'steps': 7043, 'loss/train': 1.789720058441162} +11/06/2021 22:14:10 - INFO - __main__ - Step 7045: {'lr': 0.0004985684004373409, 'samples': 1352640, 'steps': 7044, 'loss/train': 1.5516489744186401} +11/06/2021 22:14:10 - INFO - __main__ - Step 7046: {'lr': 0.0004985678332791686, 'samples': 1352832, 'steps': 7045, 'loss/train': 1.1448746919631958} +11/06/2021 22:14:11 - INFO - __main__ - Step 7047: {'lr': 0.0004985672660089956, 'samples': 1353024, 'steps': 7046, 'loss/train': 1.9174386262893677} +11/06/2021 22:14:11 - INFO - __main__ - Step 7048: {'lr': 0.000498566698626822, 'samples': 1353216, 'steps': 7047, 'loss/train': 2.0857248306274414} +11/06/2021 22:14:12 - INFO - __main__ - Step 7049: {'lr': 0.000498566131132648, 'samples': 1353408, 'steps': 7048, 'loss/train': 1.5200681686401367} +11/06/2021 22:14:13 - INFO - __main__ - Step 7050: {'lr': 0.0004985655635264739, 'samples': 1353600, 'steps': 7049, 'loss/train': 2.0432159900665283} +11/06/2021 22:14:13 - INFO - __main__ - Step 7051: {'lr': 0.0004985649958083001, 'samples': 1353792, 'steps': 7050, 'loss/train': 2.034838914871216} +11/06/2021 22:14:13 - INFO - __main__ - Step 7052: {'lr': 0.0004985644279781268, 'samples': 1353984, 'steps': 7051, 'loss/train': 2.010187864303589} +11/06/2021 22:14:14 - INFO - __main__ - Step 7053: {'lr': 0.0004985638600359542, 'samples': 1354176, 'steps': 7052, 'loss/train': 2.2024543285369873} +11/06/2021 22:14:14 - INFO - __main__ - Step 7054: {'lr': 0.0004985632919817824, 'samples': 1354368, 'steps': 7053, 'loss/train': 2.1596481800079346} +11/06/2021 22:14:14 - INFO - __main__ - Step 7055: {'lr': 0.000498562723815612, 'samples': 1354560, 'steps': 7054, 'loss/train': 1.9444608688354492} +11/06/2021 22:14:15 - INFO - __main__ - Step 7056: {'lr': 0.000498562155537443, 'samples': 1354752, 'steps': 7055, 'loss/train': 1.5930293798446655} +11/06/2021 22:14:16 - INFO - __main__ - Step 7057: {'lr': 0.0004985615871472757, 'samples': 1354944, 'steps': 7056, 'loss/train': 2.356843948364258} +11/06/2021 22:14:16 - INFO - __main__ - Step 7058: {'lr': 0.0004985610186451104, 'samples': 1355136, 'steps': 7057, 'loss/train': 2.400442123413086} +11/06/2021 22:14:16 - INFO - __main__ - Step 7059: {'lr': 0.0004985604500309473, 'samples': 1355328, 'steps': 7058, 'loss/train': 1.9683334827423096} +11/06/2021 22:14:17 - INFO - __main__ - Step 7060: {'lr': 0.0004985598813047868, 'samples': 1355520, 'steps': 7059, 'loss/train': 2.3564374446868896} +11/06/2021 22:14:18 - INFO - __main__ - Step 7061: {'lr': 0.000498559312466629, 'samples': 1355712, 'steps': 7060, 'loss/train': 2.06729793548584} +11/06/2021 22:14:18 - INFO - __main__ - Step 7062: {'lr': 0.0004985587435164742, 'samples': 1355904, 'steps': 7061, 'loss/train': 2.2818222045898438} +11/06/2021 22:14:19 - INFO - __main__ - Step 7063: {'lr': 0.0004985581744543226, 'samples': 1356096, 'steps': 7062, 'loss/train': 2.8262219429016113} +11/06/2021 22:14:19 - INFO - __main__ - Step 7064: {'lr': 0.0004985576052801747, 'samples': 1356288, 'steps': 7063, 'loss/train': 2.252566337585449} +11/06/2021 22:14:19 - INFO - __main__ - Step 7065: {'lr': 0.0004985570359940304, 'samples': 1356480, 'steps': 7064, 'loss/train': 1.9672572612762451} +11/06/2021 22:14:20 - INFO - __main__ - Step 7066: {'lr': 0.0004985564665958901, 'samples': 1356672, 'steps': 7065, 'loss/train': 1.8801449537277222} +11/06/2021 22:14:21 - INFO - __main__ - Step 7067: {'lr': 0.0004985558970857543, 'samples': 1356864, 'steps': 7066, 'loss/train': 2.165799379348755} +11/06/2021 22:14:21 - INFO - __main__ - Step 7068: {'lr': 0.000498555327463623, 'samples': 1357056, 'steps': 7067, 'loss/train': 1.7966886758804321} +11/06/2021 22:14:21 - INFO - __main__ - Step 7069: {'lr': 0.0004985547577294963, 'samples': 1357248, 'steps': 7068, 'loss/train': 1.4728955030441284} +11/06/2021 22:14:22 - INFO - __main__ - Step 7070: {'lr': 0.0004985541878833749, 'samples': 1357440, 'steps': 7069, 'loss/train': 1.446349024772644} +11/06/2021 22:14:23 - INFO - __main__ - Step 7071: {'lr': 0.0004985536179252587, 'samples': 1357632, 'steps': 7070, 'loss/train': 1.8138748407363892} +11/06/2021 22:14:23 - INFO - __main__ - Step 7072: {'lr': 0.0004985530478551481, 'samples': 1357824, 'steps': 7071, 'loss/train': 1.72260582447052} +11/06/2021 22:14:23 - INFO - __main__ - Step 7073: {'lr': 0.0004985524776730434, 'samples': 1358016, 'steps': 7072, 'loss/train': 2.2067058086395264} +11/06/2021 22:14:24 - INFO - __main__ - Step 7074: {'lr': 0.0004985519073789447, 'samples': 1358208, 'steps': 7073, 'loss/train': 2.0647716522216797} +11/06/2021 22:14:24 - INFO - __main__ - Step 7075: {'lr': 0.0004985513369728524, 'samples': 1358400, 'steps': 7074, 'loss/train': 1.755244255065918} +11/06/2021 22:14:26 - INFO - __main__ - Step 7076: {'lr': 0.0004985507664547666, 'samples': 1358592, 'steps': 7075, 'loss/train': 2.965153455734253} +11/06/2021 22:14:26 - INFO - __main__ - Step 7077: {'lr': 0.0004985501958246878, 'samples': 1358784, 'steps': 7076, 'loss/train': 2.4291107654571533} +11/06/2021 22:14:26 - INFO - __main__ - Step 7078: {'lr': 0.000498549625082616, 'samples': 1358976, 'steps': 7077, 'loss/train': 1.5984909534454346} +11/06/2021 22:14:27 - INFO - __main__ - Step 7079: {'lr': 0.0004985490542285516, 'samples': 1359168, 'steps': 7078, 'loss/train': 2.098381519317627} +11/06/2021 22:14:27 - INFO - __main__ - Step 7080: {'lr': 0.0004985484832624949, 'samples': 1359360, 'steps': 7079, 'loss/train': 1.983779788017273} +11/06/2021 22:14:27 - INFO - __main__ - Step 7081: {'lr': 0.000498547912184446, 'samples': 1359552, 'steps': 7080, 'loss/train': 2.0644752979278564} +11/06/2021 22:14:28 - INFO - __main__ - Step 7082: {'lr': 0.0004985473409944054, 'samples': 1359744, 'steps': 7081, 'loss/train': 1.7944436073303223} +11/06/2021 22:14:29 - INFO - __main__ - Step 7083: {'lr': 0.000498546769692373, 'samples': 1359936, 'steps': 7082, 'loss/train': 2.2252354621887207} +11/06/2021 22:14:29 - INFO - __main__ - Step 7084: {'lr': 0.0004985461982783494, 'samples': 1360128, 'steps': 7083, 'loss/train': 1.653979778289795} +11/06/2021 22:14:30 - INFO - __main__ - Step 7085: {'lr': 0.0004985456267523346, 'samples': 1360320, 'steps': 7084, 'loss/train': 1.65984308719635} +11/06/2021 22:14:30 - INFO - __main__ - Step 7086: {'lr': 0.0004985450551143291, 'samples': 1360512, 'steps': 7085, 'loss/train': 2.264176607131958} +11/06/2021 22:14:31 - INFO - __main__ - Step 7087: {'lr': 0.000498544483364333, 'samples': 1360704, 'steps': 7086, 'loss/train': 2.1907835006713867} +11/06/2021 22:14:31 - INFO - __main__ - Step 7088: {'lr': 0.0004985439115023465, 'samples': 1360896, 'steps': 7087, 'loss/train': 1.8847299814224243} +11/06/2021 22:14:32 - INFO - __main__ - Step 7089: {'lr': 0.0004985433395283701, 'samples': 1361088, 'steps': 7088, 'loss/train': 1.9816615581512451} +11/06/2021 22:14:32 - INFO - __main__ - Step 7090: {'lr': 0.0004985427674424038, 'samples': 1361280, 'steps': 7089, 'loss/train': 1.8997712135314941} +11/06/2021 22:14:32 - INFO - __main__ - Step 7091: {'lr': 0.000498542195244448, 'samples': 1361472, 'steps': 7090, 'loss/train': 1.139441967010498} +11/06/2021 22:14:33 - INFO - __main__ - Step 7092: {'lr': 0.0004985416229345029, 'samples': 1361664, 'steps': 7091, 'loss/train': 1.571520209312439} +11/06/2021 22:14:34 - INFO - __main__ - Step 7093: {'lr': 0.0004985410505125689, 'samples': 1361856, 'steps': 7092, 'loss/train': 2.138139486312866} +11/06/2021 22:14:34 - INFO - __main__ - Step 7094: {'lr': 0.0004985404779786459, 'samples': 1362048, 'steps': 7093, 'loss/train': 2.261357545852661} +11/06/2021 22:14:35 - INFO - __main__ - Step 7095: {'lr': 0.0004985399053327346, 'samples': 1362240, 'steps': 7094, 'loss/train': 1.7595309019088745} +11/06/2021 22:14:35 - INFO - __main__ - Step 7096: {'lr': 0.000498539332574835, 'samples': 1362432, 'steps': 7095, 'loss/train': 1.8926126956939697} +11/06/2021 22:14:35 - INFO - __main__ - Step 7097: {'lr': 0.0004985387597049474, 'samples': 1362624, 'steps': 7096, 'loss/train': 2.004615306854248} +11/06/2021 22:14:37 - INFO - __main__ - Step 7098: {'lr': 0.0004985381867230721, 'samples': 1362816, 'steps': 7097, 'loss/train': 1.6198385953903198} +11/06/2021 22:14:37 - INFO - __main__ - Step 7099: {'lr': 0.0004985376136292093, 'samples': 1363008, 'steps': 7098, 'loss/train': 1.9833897352218628} +11/06/2021 22:14:37 - INFO - __main__ - Step 7100: {'lr': 0.0004985370404233592, 'samples': 1363200, 'steps': 7099, 'loss/train': 1.9819221496582031} +11/06/2021 22:14:38 - INFO - __main__ - Step 7101: {'lr': 0.0004985364671055223, 'samples': 1363392, 'steps': 7100, 'loss/train': 2.0017964839935303} +11/06/2021 22:14:38 - INFO - __main__ - Step 7102: {'lr': 0.0004985358936756985, 'samples': 1363584, 'steps': 7101, 'loss/train': 1.8916939496994019} +11/06/2021 22:14:38 - INFO - __main__ - Step 7103: {'lr': 0.0004985353201338885, 'samples': 1363776, 'steps': 7102, 'loss/train': 1.6781333684921265} +11/06/2021 22:14:39 - INFO - __main__ - Step 7104: {'lr': 0.0004985347464800921, 'samples': 1363968, 'steps': 7103, 'loss/train': 0.41633597016334534} +11/06/2021 22:14:40 - INFO - __main__ - Step 7105: {'lr': 0.0004985341727143099, 'samples': 1364160, 'steps': 7104, 'loss/train': 1.5315263271331787} +11/06/2021 22:14:40 - INFO - __main__ - Step 7106: {'lr': 0.000498533598836542, 'samples': 1364352, 'steps': 7105, 'loss/train': 1.2057009935379028} +11/06/2021 22:14:40 - INFO - __main__ - Step 7107: {'lr': 0.0004985330248467888, 'samples': 1364544, 'steps': 7106, 'loss/train': 1.7681790590286255} +11/06/2021 22:14:41 - INFO - __main__ - Step 7108: {'lr': 0.0004985324507450504, 'samples': 1364736, 'steps': 7107, 'loss/train': 1.7636619806289673} +11/06/2021 22:14:42 - INFO - __main__ - Step 7109: {'lr': 0.000498531876531327, 'samples': 1364928, 'steps': 7108, 'loss/train': 1.970746397972107} +11/06/2021 22:14:42 - INFO - __main__ - Step 7110: {'lr': 0.0004985313022056191, 'samples': 1365120, 'steps': 7109, 'loss/train': 1.8806291818618774} +11/06/2021 22:14:43 - INFO - __main__ - Step 7111: {'lr': 0.0004985307277679267, 'samples': 1365312, 'steps': 7110, 'loss/train': 1.3008683919906616} +11/06/2021 22:14:43 - INFO - __main__ - Step 7112: {'lr': 0.0004985301532182503, 'samples': 1365504, 'steps': 7111, 'loss/train': 1.9515055418014526} +11/06/2021 22:14:43 - INFO - __main__ - Step 7113: {'lr': 0.0004985295785565901, 'samples': 1365696, 'steps': 7112, 'loss/train': 1.8485970497131348} +11/06/2021 22:14:44 - INFO - __main__ - Step 7114: {'lr': 0.0004985290037829462, 'samples': 1365888, 'steps': 7113, 'loss/train': 3.7923812866210938} +11/06/2021 22:14:45 - INFO - __main__ - Step 7115: {'lr': 0.000498528428897319, 'samples': 1366080, 'steps': 7114, 'loss/train': 1.5386725664138794} +11/06/2021 22:14:45 - INFO - __main__ - Step 7116: {'lr': 0.0004985278538997088, 'samples': 1366272, 'steps': 7115, 'loss/train': 2.0282657146453857} +11/06/2021 22:14:45 - INFO - __main__ - Step 7117: {'lr': 0.0004985272787901156, 'samples': 1366464, 'steps': 7116, 'loss/train': 2.3269381523132324} +11/06/2021 22:14:46 - INFO - __main__ - Step 7118: {'lr': 0.00049852670356854, 'samples': 1366656, 'steps': 7117, 'loss/train': 1.7581599950790405} +11/06/2021 22:14:47 - INFO - __main__ - Step 7119: {'lr': 0.000498526128234982, 'samples': 1366848, 'steps': 7118, 'loss/train': 2.1720402240753174} +11/06/2021 22:14:47 - INFO - __main__ - Step 7120: {'lr': 0.000498525552789442, 'samples': 1367040, 'steps': 7119, 'loss/train': 1.491886019706726} +11/06/2021 22:14:48 - INFO - __main__ - Step 7121: {'lr': 0.0004985249772319202, 'samples': 1367232, 'steps': 7120, 'loss/train': 2.0638139247894287} +11/06/2021 22:14:48 - INFO - __main__ - Step 7122: {'lr': 0.000498524401562417, 'samples': 1367424, 'steps': 7121, 'loss/train': 1.7350369691848755} +11/06/2021 22:14:48 - INFO - __main__ - Step 7123: {'lr': 0.0004985238257809325, 'samples': 1367616, 'steps': 7122, 'loss/train': 2.518477201461792} +11/06/2021 22:14:49 - INFO - __main__ - Step 7124: {'lr': 0.0004985232498874669, 'samples': 1367808, 'steps': 7123, 'loss/train': 1.7711327075958252} +11/06/2021 22:14:50 - INFO - __main__ - Step 7125: {'lr': 0.0004985226738820207, 'samples': 1368000, 'steps': 7124, 'loss/train': 1.2557427883148193} +11/06/2021 22:14:50 - INFO - __main__ - Step 7126: {'lr': 0.0004985220977645939, 'samples': 1368192, 'steps': 7125, 'loss/train': 2.177485942840576} +11/06/2021 22:14:50 - INFO - __main__ - Step 7127: {'lr': 0.0004985215215351869, 'samples': 1368384, 'steps': 7126, 'loss/train': 1.9587048292160034} +11/06/2021 22:14:51 - INFO - __main__ - Step 7128: {'lr': 0.0004985209451937999, 'samples': 1368576, 'steps': 7127, 'loss/train': 2.1263420581817627} +11/06/2021 22:14:51 - INFO - __main__ - Step 7129: {'lr': 0.0004985203687404333, 'samples': 1368768, 'steps': 7128, 'loss/train': 1.8560582399368286} +11/06/2021 22:14:52 - INFO - __main__ - Step 7130: {'lr': 0.0004985197921750871, 'samples': 1368960, 'steps': 7129, 'loss/train': 1.6565303802490234} +11/06/2021 22:14:52 - INFO - __main__ - Step 7131: {'lr': 0.0004985192154977619, 'samples': 1369152, 'steps': 7130, 'loss/train': 1.868842601776123} +11/06/2021 22:14:53 - INFO - __main__ - Step 7132: {'lr': 0.0004985186387084577, 'samples': 1369344, 'steps': 7131, 'loss/train': 1.80448317527771} +11/06/2021 22:14:53 - INFO - __main__ - Step 7133: {'lr': 0.0004985180618071748, 'samples': 1369536, 'steps': 7132, 'loss/train': 1.7268800735473633} +11/06/2021 22:14:53 - INFO - __main__ - Step 7134: {'lr': 0.0004985174847939135, 'samples': 1369728, 'steps': 7133, 'loss/train': 2.039775848388672} +11/06/2021 22:14:55 - INFO - __main__ - Step 7135: {'lr': 0.0004985169076686741, 'samples': 1369920, 'steps': 7134, 'loss/train': 1.5857948064804077} +11/06/2021 22:14:55 - INFO - __main__ - Step 7136: {'lr': 0.0004985163304314568, 'samples': 1370112, 'steps': 7135, 'loss/train': 1.8448445796966553} +11/06/2021 22:14:55 - INFO - __main__ - Step 7137: {'lr': 0.0004985157530822619, 'samples': 1370304, 'steps': 7136, 'loss/train': 1.450709342956543} +11/06/2021 22:14:56 - INFO - __main__ - Step 7138: {'lr': 0.0004985151756210897, 'samples': 1370496, 'steps': 7137, 'loss/train': 1.8486833572387695} +11/06/2021 22:14:56 - INFO - __main__ - Step 7139: {'lr': 0.0004985145980479402, 'samples': 1370688, 'steps': 7138, 'loss/train': 1.828140377998352} +11/06/2021 22:14:57 - INFO - __main__ - Step 7140: {'lr': 0.000498514020362814, 'samples': 1370880, 'steps': 7139, 'loss/train': 1.5421890020370483} +11/06/2021 22:14:57 - INFO - __main__ - Step 7141: {'lr': 0.0004985134425657111, 'samples': 1371072, 'steps': 7140, 'loss/train': 2.6949613094329834} +11/06/2021 22:14:58 - INFO - __main__ - Step 7142: {'lr': 0.000498512864656632, 'samples': 1371264, 'steps': 7141, 'loss/train': 1.5988658666610718} +11/06/2021 22:14:58 - INFO - __main__ - Step 7143: {'lr': 0.0004985122866355768, 'samples': 1371456, 'steps': 7142, 'loss/train': 2.1116602420806885} +11/06/2021 22:14:58 - INFO - __main__ - Step 7144: {'lr': 0.0004985117085025458, 'samples': 1371648, 'steps': 7143, 'loss/train': 2.3443734645843506} +11/06/2021 22:14:59 - INFO - __main__ - Step 7145: {'lr': 0.0004985111302575392, 'samples': 1371840, 'steps': 7144, 'loss/train': 1.9202158451080322} +11/06/2021 22:15:00 - INFO - __main__ - Step 7146: {'lr': 0.0004985105519005573, 'samples': 1372032, 'steps': 7145, 'loss/train': 1.7188575267791748} +11/06/2021 22:15:00 - INFO - __main__ - Step 7147: {'lr': 0.0004985099734316006, 'samples': 1372224, 'steps': 7146, 'loss/train': 1.5859005451202393} +11/06/2021 22:15:00 - INFO - __main__ - Step 7148: {'lr': 0.0004985093948506689, 'samples': 1372416, 'steps': 7147, 'loss/train': 1.5859280824661255} +11/06/2021 22:15:01 - INFO - __main__ - Step 7149: {'lr': 0.0004985088161577628, 'samples': 1372608, 'steps': 7148, 'loss/train': 1.8605209589004517} +11/06/2021 22:15:01 - INFO - __main__ - Step 7150: {'lr': 0.0004985082373528825, 'samples': 1372800, 'steps': 7149, 'loss/train': 2.1094627380371094} +11/06/2021 22:15:02 - INFO - __main__ - Step 7151: {'lr': 0.0004985076584360282, 'samples': 1372992, 'steps': 7150, 'loss/train': 2.0223774909973145} +11/06/2021 22:15:03 - INFO - __main__ - Step 7152: {'lr': 0.0004985070794072002, 'samples': 1373184, 'steps': 7151, 'loss/train': 2.0557656288146973} +11/06/2021 22:15:03 - INFO - __main__ - Step 7153: {'lr': 0.0004985065002663986, 'samples': 1373376, 'steps': 7152, 'loss/train': 1.9789502620697021} +11/06/2021 22:15:03 - INFO - __main__ - Step 7154: {'lr': 0.000498505921013624, 'samples': 1373568, 'steps': 7153, 'loss/train': 1.9508652687072754} +11/06/2021 22:15:04 - INFO - __main__ - Step 7155: {'lr': 0.0004985053416488764, 'samples': 1373760, 'steps': 7154, 'loss/train': 2.078094244003296} +11/06/2021 22:15:05 - INFO - __main__ - Step 7156: {'lr': 0.0004985047621721561, 'samples': 1373952, 'steps': 7155, 'loss/train': 0.8238686323165894} +11/06/2021 22:15:05 - INFO - __main__ - Step 7157: {'lr': 0.0004985041825834634, 'samples': 1374144, 'steps': 7156, 'loss/train': 1.8907822370529175} +11/06/2021 22:15:05 - INFO - __main__ - Step 7158: {'lr': 0.0004985036028827986, 'samples': 1374336, 'steps': 7157, 'loss/train': 2.6892762184143066} +11/06/2021 22:15:06 - INFO - __main__ - Step 7159: {'lr': 0.0004985030230701619, 'samples': 1374528, 'steps': 7158, 'loss/train': 2.3940746784210205} +11/06/2021 22:15:06 - INFO - __main__ - Step 7160: {'lr': 0.0004985024431455534, 'samples': 1374720, 'steps': 7159, 'loss/train': 1.8155590295791626} +11/06/2021 22:15:07 - INFO - __main__ - Step 7161: {'lr': 0.0004985018631089738, 'samples': 1374912, 'steps': 7160, 'loss/train': 2.003696918487549} +11/06/2021 22:15:07 - INFO - __main__ - Step 7162: {'lr': 0.0004985012829604228, 'samples': 1375104, 'steps': 7161, 'loss/train': 1.8686398267745972} +11/06/2021 22:15:08 - INFO - __main__ - Step 7163: {'lr': 0.0004985007026999011, 'samples': 1375296, 'steps': 7162, 'loss/train': 1.7682377099990845} +11/06/2021 22:15:08 - INFO - __main__ - Step 7164: {'lr': 0.0004985001223274089, 'samples': 1375488, 'steps': 7163, 'loss/train': 2.357848644256592} +11/06/2021 22:15:08 - INFO - __main__ - Step 7165: {'lr': 0.0004984995418429463, 'samples': 1375680, 'steps': 7164, 'loss/train': 2.2802202701568604} +11/06/2021 22:15:09 - INFO - __main__ - Step 7166: {'lr': 0.0004984989612465137, 'samples': 1375872, 'steps': 7165, 'loss/train': 2.0252628326416016} +11/06/2021 22:15:10 - INFO - __main__ - Step 7167: {'lr': 0.0004984983805381112, 'samples': 1376064, 'steps': 7166, 'loss/train': 1.8542309999465942} +11/06/2021 22:15:10 - INFO - __main__ - Step 7168: {'lr': 0.0004984977997177393, 'samples': 1376256, 'steps': 7167, 'loss/train': 1.5369564294815063} +11/06/2021 22:15:10 - INFO - __main__ - Step 7169: {'lr': 0.000498497218785398, 'samples': 1376448, 'steps': 7168, 'loss/train': 1.955859899520874} +11/06/2021 22:15:11 - INFO - __main__ - Step 7170: {'lr': 0.0004984966377410878, 'samples': 1376640, 'steps': 7169, 'loss/train': 2.5765957832336426} +11/06/2021 22:15:12 - INFO - __main__ - Step 7171: {'lr': 0.0004984960565848086, 'samples': 1376832, 'steps': 7170, 'loss/train': 2.264620304107666} +11/06/2021 22:15:12 - INFO - __main__ - Step 7172: {'lr': 0.0004984954753165612, 'samples': 1377024, 'steps': 7171, 'loss/train': 1.8249037265777588} +11/06/2021 22:15:13 - INFO - __main__ - Step 7173: {'lr': 0.0004984948939363455, 'samples': 1377216, 'steps': 7172, 'loss/train': 1.3821079730987549} +11/06/2021 22:15:13 - INFO - __main__ - Step 7174: {'lr': 0.0004984943124441617, 'samples': 1377408, 'steps': 7173, 'loss/train': 1.980968952178955} +11/06/2021 22:15:13 - INFO - __main__ - Step 7175: {'lr': 0.0004984937308400104, 'samples': 1377600, 'steps': 7174, 'loss/train': 1.0405446290969849} +11/06/2021 22:15:15 - INFO - __main__ - Step 7176: {'lr': 0.0004984931491238915, 'samples': 1377792, 'steps': 7175, 'loss/train': 2.0840656757354736} +11/06/2021 22:15:15 - INFO - __main__ - Step 7177: {'lr': 0.0004984925672958055, 'samples': 1377984, 'steps': 7176, 'loss/train': 1.7736377716064453} +11/06/2021 22:15:15 - INFO - __main__ - Step 7178: {'lr': 0.0004984919853557526, 'samples': 1378176, 'steps': 7177, 'loss/train': 2.2246837615966797} +11/06/2021 22:15:16 - INFO - __main__ - Step 7179: {'lr': 0.000498491403303733, 'samples': 1378368, 'steps': 7178, 'loss/train': 2.4547572135925293} +11/06/2021 22:15:16 - INFO - __main__ - Step 7180: {'lr': 0.000498490821139747, 'samples': 1378560, 'steps': 7179, 'loss/train': 1.4960209131240845} +11/06/2021 22:15:16 - INFO - __main__ - Step 7181: {'lr': 0.0004984902388637949, 'samples': 1378752, 'steps': 7180, 'loss/train': 1.8791706562042236} +11/06/2021 22:15:17 - INFO - __main__ - Step 7182: {'lr': 0.000498489656475877, 'samples': 1378944, 'steps': 7181, 'loss/train': 2.0455527305603027} +11/06/2021 22:15:18 - INFO - __main__ - Step 7183: {'lr': 0.0004984890739759934, 'samples': 1379136, 'steps': 7182, 'loss/train': 1.8560911417007446} +11/06/2021 22:15:18 - INFO - __main__ - Step 7184: {'lr': 0.0004984884913641444, 'samples': 1379328, 'steps': 7183, 'loss/train': 2.0507397651672363} +11/06/2021 22:15:18 - INFO - __main__ - Step 7185: {'lr': 0.0004984879086403304, 'samples': 1379520, 'steps': 7184, 'loss/train': 2.017399311065674} +11/06/2021 22:15:19 - INFO - __main__ - Step 7186: {'lr': 0.0004984873258045517, 'samples': 1379712, 'steps': 7185, 'loss/train': 1.7196428775787354} +11/06/2021 22:15:19 - INFO - __main__ - Step 7187: {'lr': 0.0004984867428568083, 'samples': 1379904, 'steps': 7186, 'loss/train': 1.79092276096344} +11/06/2021 22:15:20 - INFO - __main__ - Step 7188: {'lr': 0.0004984861597971006, 'samples': 1380096, 'steps': 7187, 'loss/train': 2.169832468032837} +11/06/2021 22:15:21 - INFO - __main__ - Step 7189: {'lr': 0.000498485576625429, 'samples': 1380288, 'steps': 7188, 'loss/train': 1.9039487838745117} +11/06/2021 22:15:21 - INFO - __main__ - Step 7190: {'lr': 0.0004984849933417935, 'samples': 1380480, 'steps': 7189, 'loss/train': 1.6038901805877686} +11/06/2021 22:15:21 - INFO - __main__ - Step 7191: {'lr': 0.0004984844099461945, 'samples': 1380672, 'steps': 7190, 'loss/train': 1.7970324754714966} +11/06/2021 22:15:22 - INFO - __main__ - Step 7192: {'lr': 0.0004984838264386322, 'samples': 1380864, 'steps': 7191, 'loss/train': 1.7720707654953003} +11/06/2021 22:15:23 - INFO - __main__ - Step 7193: {'lr': 0.000498483242819107, 'samples': 1381056, 'steps': 7192, 'loss/train': 1.6350319385528564} +11/06/2021 22:15:23 - INFO - __main__ - Step 7194: {'lr': 0.0004984826590876192, 'samples': 1381248, 'steps': 7193, 'loss/train': 1.857775092124939} +11/06/2021 22:15:23 - INFO - __main__ - Step 7195: {'lr': 0.0004984820752441688, 'samples': 1381440, 'steps': 7194, 'loss/train': 1.664402961730957} +11/06/2021 22:15:24 - INFO - __main__ - Step 7196: {'lr': 0.0004984814912887563, 'samples': 1381632, 'steps': 7195, 'loss/train': 2.1821253299713135} +11/06/2021 22:15:24 - INFO - __main__ - Step 7197: {'lr': 0.0004984809072213818, 'samples': 1381824, 'steps': 7196, 'loss/train': 1.2754813432693481} +11/06/2021 22:15:25 - INFO - __main__ - Step 7198: {'lr': 0.0004984803230420457, 'samples': 1382016, 'steps': 7197, 'loss/train': 1.7471867799758911} +11/06/2021 22:15:25 - INFO - __main__ - Step 7199: {'lr': 0.0004984797387507481, 'samples': 1382208, 'steps': 7198, 'loss/train': 1.889627456665039} +11/06/2021 22:15:26 - INFO - __main__ - Step 7200: {'lr': 0.0004984791543474896, 'samples': 1382400, 'steps': 7199, 'loss/train': 1.987942099571228} +11/06/2021 22:15:26 - INFO - __main__ - Step 7201: {'lr': 0.0004984785698322699, 'samples': 1382592, 'steps': 7200, 'loss/train': 1.3614236116409302} +11/06/2021 22:15:26 - INFO - __main__ - Step 7202: {'lr': 0.0004984779852050898, 'samples': 1382784, 'steps': 7201, 'loss/train': 1.576859712600708} +11/06/2021 22:15:28 - INFO - __main__ - Step 7203: {'lr': 0.0004984774004659493, 'samples': 1382976, 'steps': 7202, 'loss/train': 2.200059413909912} +11/06/2021 22:15:28 - INFO - __main__ - Step 7204: {'lr': 0.0004984768156148489, 'samples': 1383168, 'steps': 7203, 'loss/train': 2.1063573360443115} +11/06/2021 22:15:28 - INFO - __main__ - Step 7205: {'lr': 0.0004984762306517883, 'samples': 1383360, 'steps': 7204, 'loss/train': 2.0486106872558594} +11/06/2021 22:15:29 - INFO - __main__ - Step 7206: {'lr': 0.0004984756455767684, 'samples': 1383552, 'steps': 7205, 'loss/train': 1.8581416606903076} +11/06/2021 22:15:29 - INFO - __main__ - Step 7207: {'lr': 0.0004984750603897892, 'samples': 1383744, 'steps': 7206, 'loss/train': 1.1366732120513916} +11/06/2021 22:15:29 - INFO - __main__ - Step 7208: {'lr': 0.0004984744750908509, 'samples': 1383936, 'steps': 7207, 'loss/train': 1.8445619344711304} +11/06/2021 22:15:30 - INFO - __main__ - Step 7209: {'lr': 0.0004984738896799539, 'samples': 1384128, 'steps': 7208, 'loss/train': 2.4114151000976562} +11/06/2021 22:15:31 - INFO - __main__ - Step 7210: {'lr': 0.0004984733041570983, 'samples': 1384320, 'steps': 7209, 'loss/train': 1.8552770614624023} +11/06/2021 22:15:31 - INFO - __main__ - Step 7211: {'lr': 0.0004984727185222846, 'samples': 1384512, 'steps': 7210, 'loss/train': 2.154346466064453} +11/06/2021 22:15:31 - INFO - __main__ - Step 7212: {'lr': 0.0004984721327755128, 'samples': 1384704, 'steps': 7211, 'loss/train': 2.079803466796875} +11/06/2021 22:15:32 - INFO - __main__ - Step 7213: {'lr': 0.0004984715469167835, 'samples': 1384896, 'steps': 7212, 'loss/train': 1.798585295677185} +11/06/2021 22:15:33 - INFO - __main__ - Step 7214: {'lr': 0.0004984709609460966, 'samples': 1385088, 'steps': 7213, 'loss/train': 1.8755601644515991} +11/06/2021 22:15:33 - INFO - __main__ - Step 7215: {'lr': 0.0004984703748634524, 'samples': 1385280, 'steps': 7214, 'loss/train': 1.9229755401611328} +11/06/2021 22:15:33 - INFO - __main__ - Step 7216: {'lr': 0.0004984697886688514, 'samples': 1385472, 'steps': 7215, 'loss/train': 2.1766183376312256} +11/06/2021 22:15:34 - INFO - __main__ - Step 7217: {'lr': 0.0004984692023622938, 'samples': 1385664, 'steps': 7216, 'loss/train': 2.0930893421173096} +11/06/2021 22:15:34 - INFO - __main__ - Step 7218: {'lr': 0.0004984686159437798, 'samples': 1385856, 'steps': 7217, 'loss/train': 1.6894450187683105} +11/06/2021 22:15:35 - INFO - __main__ - Step 7219: {'lr': 0.0004984680294133096, 'samples': 1386048, 'steps': 7218, 'loss/train': 2.3785271644592285} +11/06/2021 22:15:35 - INFO - __main__ - Step 7220: {'lr': 0.0004984674427708836, 'samples': 1386240, 'steps': 7219, 'loss/train': 2.290306806564331} +11/06/2021 22:15:36 - INFO - __main__ - Step 7221: {'lr': 0.000498466856016502, 'samples': 1386432, 'steps': 7220, 'loss/train': 1.620937705039978} +11/06/2021 22:15:36 - INFO - __main__ - Step 7222: {'lr': 0.000498466269150165, 'samples': 1386624, 'steps': 7221, 'loss/train': 1.4030883312225342} +11/06/2021 22:15:36 - INFO - __main__ - Step 7223: {'lr': 0.000498465682171873, 'samples': 1386816, 'steps': 7222, 'loss/train': 2.2824783325195312} +11/06/2021 22:15:37 - INFO - __main__ - Step 7224: {'lr': 0.0004984650950816262, 'samples': 1387008, 'steps': 7223, 'loss/train': 2.3977138996124268} +11/06/2021 22:15:38 - INFO - __main__ - Step 7225: {'lr': 0.0004984645078794248, 'samples': 1387200, 'steps': 7224, 'loss/train': 1.694911241531372} +11/06/2021 22:15:38 - INFO - __main__ - Step 7226: {'lr': 0.0004984639205652692, 'samples': 1387392, 'steps': 7225, 'loss/train': 2.0143306255340576} +11/06/2021 22:15:39 - INFO - __main__ - Step 7227: {'lr': 0.0004984633331391596, 'samples': 1387584, 'steps': 7226, 'loss/train': 1.6768375635147095} +11/06/2021 22:15:39 - INFO - __main__ - Step 7228: {'lr': 0.0004984627456010962, 'samples': 1387776, 'steps': 7227, 'loss/train': 1.5799198150634766} +11/06/2021 22:15:39 - INFO - __main__ - Step 7229: {'lr': 0.0004984621579510794, 'samples': 1387968, 'steps': 7228, 'loss/train': 1.486791729927063} +11/06/2021 22:15:40 - INFO - __main__ - Step 7230: {'lr': 0.0004984615701891093, 'samples': 1388160, 'steps': 7229, 'loss/train': 3.868530035018921} +11/06/2021 22:15:41 - INFO - __main__ - Step 7231: {'lr': 0.0004984609823151863, 'samples': 1388352, 'steps': 7230, 'loss/train': 0.9350582957267761} +11/06/2021 22:15:41 - INFO - __main__ - Step 7232: {'lr': 0.0004984603943293106, 'samples': 1388544, 'steps': 7231, 'loss/train': 0.9871623516082764} +11/06/2021 22:15:41 - INFO - __main__ - Step 7233: {'lr': 0.0004984598062314824, 'samples': 1388736, 'steps': 7232, 'loss/train': 1.3852111101150513} +11/06/2021 22:15:42 - INFO - __main__ - Step 7234: {'lr': 0.0004984592180217022, 'samples': 1388928, 'steps': 7233, 'loss/train': 1.602423906326294} +11/06/2021 22:15:43 - INFO - __main__ - Step 7235: {'lr': 0.00049845862969997, 'samples': 1389120, 'steps': 7234, 'loss/train': 2.038180351257324} +11/06/2021 22:15:43 - INFO - __main__ - Step 7236: {'lr': 0.0004984580412662862, 'samples': 1389312, 'steps': 7235, 'loss/train': 2.45739483833313} +11/06/2021 22:15:44 - INFO - __main__ - Step 7237: {'lr': 0.000498457452720651, 'samples': 1389504, 'steps': 7236, 'loss/train': 2.169727087020874} +11/06/2021 22:15:44 - INFO - __main__ - Step 7238: {'lr': 0.0004984568640630648, 'samples': 1389696, 'steps': 7237, 'loss/train': 1.3969769477844238} +11/06/2021 22:15:44 - INFO - __main__ - Step 7239: {'lr': 0.0004984562752935278, 'samples': 1389888, 'steps': 7238, 'loss/train': 2.331590175628662} +11/06/2021 22:15:45 - INFO - __main__ - Step 7240: {'lr': 0.0004984556864120401, 'samples': 1390080, 'steps': 7239, 'loss/train': 1.9875437021255493} +11/06/2021 22:15:46 - INFO - __main__ - Step 7241: {'lr': 0.0004984550974186021, 'samples': 1390272, 'steps': 7240, 'loss/train': 2.1947824954986572} +11/06/2021 22:15:46 - INFO - __main__ - Step 7242: {'lr': 0.0004984545083132142, 'samples': 1390464, 'steps': 7241, 'loss/train': 1.9179041385650635} +11/06/2021 22:15:46 - INFO - __main__ - Step 7243: {'lr': 0.0004984539190958765, 'samples': 1390656, 'steps': 7242, 'loss/train': 2.117086887359619} +11/06/2021 22:15:47 - INFO - __main__ - Step 7244: {'lr': 0.0004984533297665892, 'samples': 1390848, 'steps': 7243, 'loss/train': 1.8736786842346191} +11/06/2021 22:15:48 - INFO - __main__ - Step 7245: {'lr': 0.0004984527403253527, 'samples': 1391040, 'steps': 7244, 'loss/train': 2.511869430541992} +11/06/2021 22:15:48 - INFO - __main__ - Step 7246: {'lr': 0.0004984521507721672, 'samples': 1391232, 'steps': 7245, 'loss/train': 2.5657119750976562} +11/06/2021 22:15:48 - INFO - __main__ - Step 7247: {'lr': 0.0004984515611070331, 'samples': 1391424, 'steps': 7246, 'loss/train': 1.9452552795410156} +11/06/2021 22:15:49 - INFO - __main__ - Step 7248: {'lr': 0.0004984509713299505, 'samples': 1391616, 'steps': 7247, 'loss/train': 1.7578961849212646} +11/06/2021 22:15:49 - INFO - __main__ - Step 7249: {'lr': 0.0004984503814409198, 'samples': 1391808, 'steps': 7248, 'loss/train': 1.7365186214447021} +11/06/2021 22:15:49 - INFO - __main__ - Step 7250: {'lr': 0.000498449791439941, 'samples': 1392000, 'steps': 7249, 'loss/train': 2.028444766998291} +11/06/2021 22:15:50 - INFO - __main__ - Step 7251: {'lr': 0.0004984492013270147, 'samples': 1392192, 'steps': 7250, 'loss/train': 1.9997104406356812} +11/06/2021 22:15:51 - INFO - __main__ - Step 7252: {'lr': 0.0004984486111021411, 'samples': 1392384, 'steps': 7251, 'loss/train': 1.7183914184570312} +11/06/2021 22:15:51 - INFO - __main__ - Step 7253: {'lr': 0.0004984480207653202, 'samples': 1392576, 'steps': 7252, 'loss/train': 1.8998106718063354} +11/06/2021 22:15:52 - INFO - __main__ - Step 7254: {'lr': 0.0004984474303165526, 'samples': 1392768, 'steps': 7253, 'loss/train': 1.8647713661193848} +11/06/2021 22:15:52 - INFO - __main__ - Step 7255: {'lr': 0.0004984468397558384, 'samples': 1392960, 'steps': 7254, 'loss/train': 1.3238756656646729} +11/06/2021 22:15:53 - INFO - __main__ - Step 7256: {'lr': 0.0004984462490831778, 'samples': 1393152, 'steps': 7255, 'loss/train': 2.027043104171753} +11/06/2021 22:15:53 - INFO - __main__ - Step 7257: {'lr': 0.0004984456582985713, 'samples': 1393344, 'steps': 7256, 'loss/train': 1.4800242185592651} +11/06/2021 22:15:54 - INFO - __main__ - Step 7258: {'lr': 0.0004984450674020189, 'samples': 1393536, 'steps': 7257, 'loss/train': 2.1049439907073975} +11/06/2021 22:15:54 - INFO - __main__ - Step 7259: {'lr': 0.000498444476393521, 'samples': 1393728, 'steps': 7258, 'loss/train': 2.349273920059204} +11/06/2021 22:15:54 - INFO - __main__ - Step 7260: {'lr': 0.0004984438852730779, 'samples': 1393920, 'steps': 7259, 'loss/train': 1.9256495237350464} +11/06/2021 22:15:55 - INFO - __main__ - Step 7261: {'lr': 0.0004984432940406898, 'samples': 1394112, 'steps': 7260, 'loss/train': 1.3321802616119385} +11/06/2021 22:15:56 - INFO - __main__ - Step 7262: {'lr': 0.0004984427026963569, 'samples': 1394304, 'steps': 7261, 'loss/train': 1.8123741149902344} +11/06/2021 22:15:56 - INFO - __main__ - Step 7263: {'lr': 0.0004984421112400796, 'samples': 1394496, 'steps': 7262, 'loss/train': 1.7774724960327148} +11/06/2021 22:15:56 - INFO - __main__ - Step 7264: {'lr': 0.0004984415196718582, 'samples': 1394688, 'steps': 7263, 'loss/train': 1.5477303266525269} +11/06/2021 22:15:57 - INFO - __main__ - Step 7265: {'lr': 0.0004984409279916929, 'samples': 1394880, 'steps': 7264, 'loss/train': 1.974310278892517} +11/06/2021 22:15:58 - INFO - __main__ - Step 7266: {'lr': 0.0004984403361995839, 'samples': 1395072, 'steps': 7265, 'loss/train': 1.740934133529663} +11/06/2021 22:15:58 - INFO - __main__ - Step 7267: {'lr': 0.0004984397442955315, 'samples': 1395264, 'steps': 7266, 'loss/train': 2.080972194671631} +11/06/2021 22:15:59 - INFO - __main__ - Step 7268: {'lr': 0.0004984391522795359, 'samples': 1395456, 'steps': 7267, 'loss/train': 1.868264079093933} +11/06/2021 22:15:59 - INFO - __main__ - Step 7269: {'lr': 0.0004984385601515977, 'samples': 1395648, 'steps': 7268, 'loss/train': 1.7006977796554565} +11/06/2021 22:15:59 - INFO - __main__ - Step 7270: {'lr': 0.0004984379679117166, 'samples': 1395840, 'steps': 7269, 'loss/train': 2.674793004989624} +11/06/2021 22:16:00 - INFO - __main__ - Step 7271: {'lr': 0.0004984373755598934, 'samples': 1396032, 'steps': 7270, 'loss/train': 1.7683382034301758} +11/06/2021 22:16:01 - INFO - __main__ - Step 7272: {'lr': 0.0004984367830961281, 'samples': 1396224, 'steps': 7271, 'loss/train': 2.167809247970581} +11/06/2021 22:16:01 - INFO - __main__ - Step 7273: {'lr': 0.0004984361905204209, 'samples': 1396416, 'steps': 7272, 'loss/train': 1.7610995769500732} +11/06/2021 22:16:01 - INFO - __main__ - Step 7274: {'lr': 0.0004984355978327724, 'samples': 1396608, 'steps': 7273, 'loss/train': 1.7615541219711304} +11/06/2021 22:16:02 - INFO - __main__ - Step 7275: {'lr': 0.0004984350050331826, 'samples': 1396800, 'steps': 7274, 'loss/train': 1.920972466468811} +11/06/2021 22:16:03 - INFO - __main__ - Step 7276: {'lr': 0.0004984344121216518, 'samples': 1396992, 'steps': 7275, 'loss/train': 1.9374135732650757} +11/06/2021 22:16:03 - INFO - __main__ - Step 7277: {'lr': 0.0004984338190981802, 'samples': 1397184, 'steps': 7276, 'loss/train': 1.6864734888076782} +11/06/2021 22:16:04 - INFO - __main__ - Step 7278: {'lr': 0.0004984332259627682, 'samples': 1397376, 'steps': 7277, 'loss/train': 1.0560840368270874} +11/06/2021 22:16:04 - INFO - __main__ - Step 7279: {'lr': 0.000498432632715416, 'samples': 1397568, 'steps': 7278, 'loss/train': 0.6851865649223328} +11/06/2021 22:16:04 - INFO - __main__ - Step 7280: {'lr': 0.000498432039356124, 'samples': 1397760, 'steps': 7279, 'loss/train': 1.729858160018921} +11/06/2021 22:16:05 - INFO - __main__ - Step 7281: {'lr': 0.0004984314458848923, 'samples': 1397952, 'steps': 7280, 'loss/train': 1.9476943016052246} +11/06/2021 22:16:06 - INFO - __main__ - Step 7282: {'lr': 0.0004984308523017212, 'samples': 1398144, 'steps': 7281, 'loss/train': 1.9683444499969482} +11/06/2021 22:16:06 - INFO - __main__ - Step 7283: {'lr': 0.000498430258606611, 'samples': 1398336, 'steps': 7282, 'loss/train': 2.0607752799987793} +11/06/2021 22:16:06 - INFO - __main__ - Step 7284: {'lr': 0.000498429664799562, 'samples': 1398528, 'steps': 7283, 'loss/train': 2.243265151977539} +11/06/2021 22:16:07 - INFO - __main__ - Step 7285: {'lr': 0.0004984290708805743, 'samples': 1398720, 'steps': 7284, 'loss/train': 1.7015665769577026} +11/06/2021 22:16:07 - INFO - __main__ - Step 7286: {'lr': 0.0004984284768496484, 'samples': 1398912, 'steps': 7285, 'loss/train': 2.0108847618103027} +11/06/2021 22:16:08 - INFO - __main__ - Step 7287: {'lr': 0.0004984278827067844, 'samples': 1399104, 'steps': 7286, 'loss/train': 5.661211967468262} +11/06/2021 22:16:08 - INFO - __main__ - Step 7288: {'lr': 0.0004984272884519827, 'samples': 1399296, 'steps': 7287, 'loss/train': 2.067732572555542} +11/06/2021 22:16:09 - INFO - __main__ - Step 7289: {'lr': 0.0004984266940852434, 'samples': 1399488, 'steps': 7288, 'loss/train': 2.0083210468292236} +11/06/2021 22:16:09 - INFO - __main__ - Step 7290: {'lr': 0.0004984260996065671, 'samples': 1399680, 'steps': 7289, 'loss/train': 1.771776795387268} +11/06/2021 22:16:10 - INFO - __main__ - Step 7291: {'lr': 0.0004984255050159536, 'samples': 1399872, 'steps': 7290, 'loss/train': 2.357623815536499} +11/06/2021 22:16:10 - INFO - __main__ - Step 7292: {'lr': 0.0004984249103134035, 'samples': 1400064, 'steps': 7291, 'loss/train': 1.8594292402267456} +11/06/2021 22:16:11 - INFO - __main__ - Step 7293: {'lr': 0.0004984243154989168, 'samples': 1400256, 'steps': 7292, 'loss/train': 1.5568764209747314} +11/06/2021 22:16:11 - INFO - __main__ - Step 7294: {'lr': 0.0004984237205724942, 'samples': 1400448, 'steps': 7293, 'loss/train': 2.0495903491973877} +11/06/2021 22:16:12 - INFO - __main__ - Step 7295: {'lr': 0.0004984231255341355, 'samples': 1400640, 'steps': 7294, 'loss/train': 1.9171841144561768} +11/06/2021 22:16:12 - INFO - __main__ - Step 7296: {'lr': 0.0004984225303838413, 'samples': 1400832, 'steps': 7295, 'loss/train': 2.2132482528686523} +11/06/2021 22:16:12 - INFO - __main__ - Step 7297: {'lr': 0.0004984219351216116, 'samples': 1401024, 'steps': 7296, 'loss/train': 2.4018189907073975} +11/06/2021 22:16:13 - INFO - __main__ - Step 7298: {'lr': 0.000498421339747447, 'samples': 1401216, 'steps': 7297, 'loss/train': 1.9810959100723267} +11/06/2021 22:16:14 - INFO - __main__ - Step 7299: {'lr': 0.0004984207442613474, 'samples': 1401408, 'steps': 7298, 'loss/train': 2.1550214290618896} +11/06/2021 22:16:14 - INFO - __main__ - Step 7300: {'lr': 0.0004984201486633134, 'samples': 1401600, 'steps': 7299, 'loss/train': 1.7208765745162964} +11/06/2021 22:16:14 - INFO - __main__ - Step 7301: {'lr': 0.0004984195529533451, 'samples': 1401792, 'steps': 7300, 'loss/train': 1.912482500076294} +11/06/2021 22:16:15 - INFO - __main__ - Step 7302: {'lr': 0.0004984189571314426, 'samples': 1401984, 'steps': 7301, 'loss/train': 2.2242941856384277} +11/06/2021 22:16:16 - INFO - __main__ - Step 7303: {'lr': 0.0004984183611976065, 'samples': 1402176, 'steps': 7302, 'loss/train': 1.918655276298523} +11/06/2021 22:16:16 - INFO - __main__ - Step 7304: {'lr': 0.0004984177651518369, 'samples': 1402368, 'steps': 7303, 'loss/train': 2.114764451980591} +11/06/2021 22:16:16 - INFO - __main__ - Step 7305: {'lr': 0.0004984171689941341, 'samples': 1402560, 'steps': 7304, 'loss/train': 1.9402523040771484} +11/06/2021 22:16:17 - INFO - __main__ - Step 7306: {'lr': 0.0004984165727244984, 'samples': 1402752, 'steps': 7305, 'loss/train': 1.6583056449890137} +11/06/2021 22:16:17 - INFO - __main__ - Step 7307: {'lr': 0.0004984159763429299, 'samples': 1402944, 'steps': 7306, 'loss/train': 1.5926767587661743} +11/06/2021 22:16:17 - INFO - __main__ - Step 7308: {'lr': 0.0004984153798494291, 'samples': 1403136, 'steps': 7307, 'loss/train': 1.6592446565628052} +11/06/2021 22:16:18 - INFO - __main__ - Step 7309: {'lr': 0.000498414783243996, 'samples': 1403328, 'steps': 7308, 'loss/train': 1.728884220123291} +11/06/2021 22:16:19 - INFO - __main__ - Step 7310: {'lr': 0.0004984141865266312, 'samples': 1403520, 'steps': 7309, 'loss/train': 0.43410855531692505} +11/06/2021 22:16:19 - INFO - __main__ - Step 7311: {'lr': 0.0004984135896973348, 'samples': 1403712, 'steps': 7310, 'loss/train': 2.0036983489990234} +11/06/2021 22:16:20 - INFO - __main__ - Step 7312: {'lr': 0.000498412992756107, 'samples': 1403904, 'steps': 7311, 'loss/train': 1.7266615629196167} +11/06/2021 22:16:20 - INFO - __main__ - Step 7313: {'lr': 0.0004984123957029482, 'samples': 1404096, 'steps': 7312, 'loss/train': 1.9898042678833008} +11/06/2021 22:16:21 - INFO - __main__ - Step 7314: {'lr': 0.0004984117985378586, 'samples': 1404288, 'steps': 7313, 'loss/train': 2.5833494663238525} +11/06/2021 22:16:21 - INFO - __main__ - Step 7315: {'lr': 0.0004984112012608384, 'samples': 1404480, 'steps': 7314, 'loss/train': 1.9153599739074707} +11/06/2021 22:16:22 - INFO - __main__ - Step 7316: {'lr': 0.000498410603871888, 'samples': 1404672, 'steps': 7315, 'loss/train': 1.9567968845367432} +11/06/2021 22:16:22 - INFO - __main__ - Step 7317: {'lr': 0.0004984100063710076, 'samples': 1404864, 'steps': 7316, 'loss/train': 1.922874927520752} +11/06/2021 22:16:22 - INFO - __main__ - Step 7318: {'lr': 0.0004984094087581975, 'samples': 1405056, 'steps': 7317, 'loss/train': 1.7780122756958008} +11/06/2021 22:16:23 - INFO - __main__ - Step 7319: {'lr': 0.0004984088110334579, 'samples': 1405248, 'steps': 7318, 'loss/train': 1.6674338579177856} +11/06/2021 22:16:24 - INFO - __main__ - Step 7320: {'lr': 0.0004984082131967892, 'samples': 1405440, 'steps': 7319, 'loss/train': 1.5355974435806274} +11/06/2021 22:16:24 - INFO - __main__ - Step 7321: {'lr': 0.0004984076152481916, 'samples': 1405632, 'steps': 7320, 'loss/train': 1.7139782905578613} +11/06/2021 22:16:24 - INFO - __main__ - Step 7322: {'lr': 0.0004984070171876653, 'samples': 1405824, 'steps': 7321, 'loss/train': 2.0687177181243896} +11/06/2021 22:16:25 - INFO - __main__ - Step 7323: {'lr': 0.0004984064190152106, 'samples': 1406016, 'steps': 7322, 'loss/train': 1.93816077709198} +11/06/2021 22:16:26 - INFO - __main__ - Step 7324: {'lr': 0.0004984058207308279, 'samples': 1406208, 'steps': 7323, 'loss/train': 1.9266688823699951} +11/06/2021 22:16:26 - INFO - __main__ - Step 7325: {'lr': 0.0004984052223345174, 'samples': 1406400, 'steps': 7324, 'loss/train': 1.676986575126648} +11/06/2021 22:16:27 - INFO - __main__ - Step 7326: {'lr': 0.0004984046238262792, 'samples': 1406592, 'steps': 7325, 'loss/train': 1.8388060331344604} +11/06/2021 22:16:27 - INFO - __main__ - Step 7327: {'lr': 0.0004984040252061137, 'samples': 1406784, 'steps': 7326, 'loss/train': 2.036705255508423} +11/06/2021 22:16:27 - INFO - __main__ - Step 7328: {'lr': 0.0004984034264740213, 'samples': 1406976, 'steps': 7327, 'loss/train': 1.4209593534469604} +11/06/2021 22:16:28 - INFO - __main__ - Step 7329: {'lr': 0.0004984028276300021, 'samples': 1407168, 'steps': 7328, 'loss/train': 1.2647329568862915} +11/06/2021 22:16:29 - INFO - __main__ - Step 7330: {'lr': 0.0004984022286740565, 'samples': 1407360, 'steps': 7329, 'loss/train': 1.7428815364837646} +11/06/2021 22:16:29 - INFO - __main__ - Step 7331: {'lr': 0.0004984016296061846, 'samples': 1407552, 'steps': 7330, 'loss/train': 1.4878357648849487} +11/06/2021 22:16:29 - INFO - __main__ - Step 7332: {'lr': 0.0004984010304263868, 'samples': 1407744, 'steps': 7331, 'loss/train': 1.8269178867340088} +11/06/2021 22:16:30 - INFO - __main__ - Step 7333: {'lr': 0.0004984004311346632, 'samples': 1407936, 'steps': 7332, 'loss/train': 1.686158299446106} +11/06/2021 22:16:31 - INFO - __main__ - Step 7334: {'lr': 0.0004983998317310143, 'samples': 1408128, 'steps': 7333, 'loss/train': 0.8892830610275269} +11/06/2021 22:16:31 - INFO - __main__ - Step 7335: {'lr': 0.0004983992322154403, 'samples': 1408320, 'steps': 7334, 'loss/train': 1.7509515285491943} +11/06/2021 22:16:31 - INFO - __main__ - Step 7336: {'lr': 0.0004983986325879414, 'samples': 1408512, 'steps': 7335, 'loss/train': 1.561832070350647} +11/06/2021 22:16:32 - INFO - __main__ - Step 7337: {'lr': 0.0004983980328485179, 'samples': 1408704, 'steps': 7336, 'loss/train': 1.7405585050582886} +11/06/2021 22:16:32 - INFO - __main__ - Step 7338: {'lr': 0.0004983974329971702, 'samples': 1408896, 'steps': 7337, 'loss/train': 1.8037465810775757} +11/06/2021 22:16:32 - INFO - __main__ - Step 7339: {'lr': 0.0004983968330338983, 'samples': 1409088, 'steps': 7338, 'loss/train': 1.8311342000961304} +11/06/2021 22:16:33 - INFO - __main__ - Step 7340: {'lr': 0.0004983962329587026, 'samples': 1409280, 'steps': 7339, 'loss/train': 1.649807333946228} +11/06/2021 22:16:34 - INFO - __main__ - Step 7341: {'lr': 0.0004983956327715835, 'samples': 1409472, 'steps': 7340, 'loss/train': 1.9435052871704102} +11/06/2021 22:16:34 - INFO - __main__ - Step 7342: {'lr': 0.000498395032472541, 'samples': 1409664, 'steps': 7341, 'loss/train': 1.9914734363555908} +11/06/2021 22:16:34 - INFO - __main__ - Step 7343: {'lr': 0.0004983944320615757, 'samples': 1409856, 'steps': 7342, 'loss/train': 2.154550552368164} +11/06/2021 22:16:35 - INFO - __main__ - Step 7344: {'lr': 0.0004983938315386877, 'samples': 1410048, 'steps': 7343, 'loss/train': 0.9631898403167725} +11/06/2021 22:16:36 - INFO - __main__ - Step 7345: {'lr': 0.0004983932309038773, 'samples': 1410240, 'steps': 7344, 'loss/train': 1.8528187274932861} +11/06/2021 22:16:36 - INFO - __main__ - Step 7346: {'lr': 0.0004983926301571445, 'samples': 1410432, 'steps': 7345, 'loss/train': 1.4792355298995972} +11/06/2021 22:16:36 - INFO - __main__ - Step 7347: {'lr': 0.00049839202929849, 'samples': 1410624, 'steps': 7346, 'loss/train': 2.132795572280884} +11/06/2021 22:16:37 - INFO - __main__ - Step 7348: {'lr': 0.0004983914283279139, 'samples': 1410816, 'steps': 7347, 'loss/train': 1.8769862651824951} +11/06/2021 22:16:37 - INFO - __main__ - Step 7349: {'lr': 0.0004983908272454164, 'samples': 1411008, 'steps': 7348, 'loss/train': 1.8160367012023926} +11/06/2021 22:16:38 - INFO - __main__ - Step 7350: {'lr': 0.0004983902260509978, 'samples': 1411200, 'steps': 7349, 'loss/train': 0.7067152857780457} +11/06/2021 22:16:38 - INFO - __main__ - Step 7351: {'lr': 0.0004983896247446585, 'samples': 1411392, 'steps': 7350, 'loss/train': 1.9250173568725586} +11/06/2021 22:16:39 - INFO - __main__ - Step 7352: {'lr': 0.0004983890233263986, 'samples': 1411584, 'steps': 7351, 'loss/train': 1.8521647453308105} +11/06/2021 22:16:39 - INFO - __main__ - Step 7353: {'lr': 0.0004983884217962185, 'samples': 1411776, 'steps': 7352, 'loss/train': 1.7597779035568237} +11/06/2021 22:16:40 - INFO - __main__ - Step 7354: {'lr': 0.0004983878201541183, 'samples': 1411968, 'steps': 7353, 'loss/train': 1.017517328262329} +11/06/2021 22:16:41 - INFO - __main__ - Step 7355: {'lr': 0.0004983872184000984, 'samples': 1412160, 'steps': 7354, 'loss/train': 2.1541800498962402} +11/06/2021 22:16:41 - INFO - __main__ - Step 7356: {'lr': 0.0004983866165341592, 'samples': 1412352, 'steps': 7355, 'loss/train': 2.184023380279541} +11/06/2021 22:16:41 - INFO - __main__ - Step 7357: {'lr': 0.0004983860145563006, 'samples': 1412544, 'steps': 7356, 'loss/train': 1.9269651174545288} +11/06/2021 22:16:42 - INFO - __main__ - Step 7358: {'lr': 0.0004983854124665232, 'samples': 1412736, 'steps': 7357, 'loss/train': 0.9575059413909912} +11/06/2021 22:16:42 - INFO - __main__ - Step 7359: {'lr': 0.0004983848102648273, 'samples': 1412928, 'steps': 7358, 'loss/train': 1.8082619905471802} +11/06/2021 22:16:43 - INFO - __main__ - Step 7360: {'lr': 0.0004983842079512128, 'samples': 1413120, 'steps': 7359, 'loss/train': 1.5754534006118774} +11/06/2021 22:16:43 - INFO - __main__ - Step 7361: {'lr': 0.0004983836055256804, 'samples': 1413312, 'steps': 7360, 'loss/train': 1.5222283601760864} +11/06/2021 22:16:44 - INFO - __main__ - Step 7362: {'lr': 0.0004983830029882301, 'samples': 1413504, 'steps': 7361, 'loss/train': 2.070965051651001} +11/06/2021 22:16:44 - INFO - __main__ - Step 7363: {'lr': 0.0004983824003388622, 'samples': 1413696, 'steps': 7362, 'loss/train': 1.8946985006332397} +11/06/2021 22:16:44 - INFO - __main__ - Step 7364: {'lr': 0.0004983817975775771, 'samples': 1413888, 'steps': 7363, 'loss/train': 1.666754126548767} +11/06/2021 22:16:45 - INFO - __main__ - Step 7365: {'lr': 0.000498381194704375, 'samples': 1414080, 'steps': 7364, 'loss/train': 1.879746675491333} +11/06/2021 22:16:46 - INFO - __main__ - Step 7366: {'lr': 0.000498380591719256, 'samples': 1414272, 'steps': 7365, 'loss/train': 1.6441892385482788} +11/06/2021 22:16:46 - INFO - __main__ - Step 7367: {'lr': 0.0004983799886222207, 'samples': 1414464, 'steps': 7366, 'loss/train': 2.2601382732391357} +11/06/2021 22:16:47 - INFO - __main__ - Step 7368: {'lr': 0.0004983793854132693, 'samples': 1414656, 'steps': 7367, 'loss/train': 1.803916335105896} +11/06/2021 22:16:47 - INFO - __main__ - Step 7369: {'lr': 0.0004983787820924019, 'samples': 1414848, 'steps': 7368, 'loss/train': 1.7164603471755981} +11/06/2021 22:16:48 - INFO - __main__ - Step 7370: {'lr': 0.0004983781786596187, 'samples': 1415040, 'steps': 7369, 'loss/train': 1.3875094652175903} +11/06/2021 22:16:48 - INFO - __main__ - Step 7371: {'lr': 0.0004983775751149204, 'samples': 1415232, 'steps': 7370, 'loss/train': 2.1840782165527344} +11/06/2021 22:16:49 - INFO - __main__ - Step 7372: {'lr': 0.0004983769714583067, 'samples': 1415424, 'steps': 7371, 'loss/train': 2.081000328063965} +11/06/2021 22:16:49 - INFO - __main__ - Step 7373: {'lr': 0.0004983763676897784, 'samples': 1415616, 'steps': 7372, 'loss/train': 1.749665379524231} +11/06/2021 22:16:49 - INFO - __main__ - Step 7374: {'lr': 0.0004983757638093355, 'samples': 1415808, 'steps': 7373, 'loss/train': 1.8339048624038696} +11/06/2021 22:16:50 - INFO - __main__ - Step 7375: {'lr': 0.0004983751598169781, 'samples': 1416000, 'steps': 7374, 'loss/train': 1.631373405456543} +11/06/2021 22:16:51 - INFO - __main__ - Step 7376: {'lr': 0.000498374555712707, 'samples': 1416192, 'steps': 7375, 'loss/train': 2.2265982627868652} +11/06/2021 22:16:51 - INFO - __main__ - Step 7377: {'lr': 0.000498373951496522, 'samples': 1416384, 'steps': 7376, 'loss/train': 2.2691292762756348} +11/06/2021 22:16:51 - INFO - __main__ - Step 7378: {'lr': 0.0004983733471684234, 'samples': 1416576, 'steps': 7377, 'loss/train': 2.114935874938965} +11/06/2021 22:16:52 - INFO - __main__ - Step 7379: {'lr': 0.0004983727427284118, 'samples': 1416768, 'steps': 7378, 'loss/train': 1.5053443908691406} +11/06/2021 22:16:52 - INFO - __main__ - Step 7380: {'lr': 0.0004983721381764873, 'samples': 1416960, 'steps': 7379, 'loss/train': 2.0003550052642822} +11/06/2021 22:16:53 - INFO - __main__ - Step 7381: {'lr': 0.00049837153351265, 'samples': 1417152, 'steps': 7380, 'loss/train': 1.6483396291732788} +11/06/2021 22:16:53 - INFO - __main__ - Step 7382: {'lr': 0.0004983709287369004, 'samples': 1417344, 'steps': 7381, 'loss/train': 1.4799424409866333} +11/06/2021 22:16:54 - INFO - __main__ - Step 7383: {'lr': 0.0004983703238492386, 'samples': 1417536, 'steps': 7382, 'loss/train': 1.8734862804412842} +11/06/2021 22:16:54 - INFO - __main__ - Step 7384: {'lr': 0.000498369718849665, 'samples': 1417728, 'steps': 7383, 'loss/train': 2.09423565864563} +11/06/2021 22:16:54 - INFO - __main__ - Step 7385: {'lr': 0.00049836911373818, 'samples': 1417920, 'steps': 7384, 'loss/train': 1.690798044204712} +11/06/2021 22:16:55 - INFO - __main__ - Step 7386: {'lr': 0.0004983685085147836, 'samples': 1418112, 'steps': 7385, 'loss/train': 1.6163359880447388} +11/06/2021 22:16:56 - INFO - __main__ - Step 7387: {'lr': 0.0004983679031794762, 'samples': 1418304, 'steps': 7386, 'loss/train': 1.860256552696228} +11/06/2021 22:16:56 - INFO - __main__ - Step 7388: {'lr': 0.000498367297732258, 'samples': 1418496, 'steps': 7387, 'loss/train': 1.9493474960327148} +11/06/2021 22:16:56 - INFO - __main__ - Step 7389: {'lr': 0.0004983666921731293, 'samples': 1418688, 'steps': 7388, 'loss/train': 1.6616744995117188} +11/06/2021 22:16:57 - INFO - __main__ - Step 7390: {'lr': 0.0004983660865020905, 'samples': 1418880, 'steps': 7389, 'loss/train': 1.901392936706543} +11/06/2021 22:16:58 - INFO - __main__ - Step 7391: {'lr': 0.0004983654807191418, 'samples': 1419072, 'steps': 7390, 'loss/train': 2.3318119049072266} +11/06/2021 22:16:58 - INFO - __main__ - Step 7392: {'lr': 0.0004983648748242833, 'samples': 1419264, 'steps': 7391, 'loss/train': 1.922995686531067} +11/06/2021 22:16:59 - INFO - __main__ - Step 7393: {'lr': 0.0004983642688175155, 'samples': 1419456, 'steps': 7392, 'loss/train': 1.9183114767074585} +11/06/2021 22:16:59 - INFO - __main__ - Step 7394: {'lr': 0.0004983636626988386, 'samples': 1419648, 'steps': 7393, 'loss/train': 2.0506041049957275} +11/06/2021 22:16:59 - INFO - __main__ - Step 7395: {'lr': 0.0004983630564682529, 'samples': 1419840, 'steps': 7394, 'loss/train': 1.6490904092788696} +11/06/2021 22:17:00 - INFO - __main__ - Step 7396: {'lr': 0.0004983624501257585, 'samples': 1420032, 'steps': 7395, 'loss/train': 2.0997846126556396} +11/06/2021 22:17:01 - INFO - __main__ - Step 7397: {'lr': 0.000498361843671356, 'samples': 1420224, 'steps': 7396, 'loss/train': 1.3421412706375122} +11/06/2021 22:17:01 - INFO - __main__ - Step 7398: {'lr': 0.0004983612371050453, 'samples': 1420416, 'steps': 7397, 'loss/train': 1.7991613149642944} +11/06/2021 22:17:01 - INFO - __main__ - Step 7399: {'lr': 0.000498360630426827, 'samples': 1420608, 'steps': 7398, 'loss/train': 2.0792791843414307} +11/06/2021 22:17:02 - INFO - __main__ - Step 7400: {'lr': 0.0004983600236367012, 'samples': 1420800, 'steps': 7399, 'loss/train': 3.388317346572876} +11/06/2021 22:17:03 - INFO - __main__ - Step 7401: {'lr': 0.0004983594167346681, 'samples': 1420992, 'steps': 7400, 'loss/train': 1.5198123455047607} +11/06/2021 22:17:03 - INFO - __main__ - Step 7402: {'lr': 0.0004983588097207283, 'samples': 1421184, 'steps': 7401, 'loss/train': 1.678063988685608} +11/06/2021 22:17:03 - INFO - __main__ - Step 7403: {'lr': 0.0004983582025948816, 'samples': 1421376, 'steps': 7402, 'loss/train': 1.8395053148269653} +11/06/2021 22:17:04 - INFO - __main__ - Step 7404: {'lr': 0.0004983575953571287, 'samples': 1421568, 'steps': 7403, 'loss/train': 0.9479645490646362} +11/06/2021 22:17:04 - INFO - __main__ - Step 7405: {'lr': 0.0004983569880074696, 'samples': 1421760, 'steps': 7404, 'loss/train': 1.9720947742462158} +11/06/2021 22:17:05 - INFO - __main__ - Step 7406: {'lr': 0.0004983563805459048, 'samples': 1421952, 'steps': 7405, 'loss/train': 1.7848727703094482} +11/06/2021 22:17:06 - INFO - __main__ - Step 7407: {'lr': 0.0004983557729724343, 'samples': 1422144, 'steps': 7406, 'loss/train': 1.2195593118667603} +11/06/2021 22:17:06 - INFO - __main__ - Step 7408: {'lr': 0.0004983551652870586, 'samples': 1422336, 'steps': 7407, 'loss/train': 1.9602643251419067} +11/06/2021 22:17:06 - INFO - __main__ - Step 7409: {'lr': 0.000498354557489778, 'samples': 1422528, 'steps': 7408, 'loss/train': 1.9274659156799316} +11/06/2021 22:17:07 - INFO - __main__ - Step 7410: {'lr': 0.0004983539495805925, 'samples': 1422720, 'steps': 7409, 'loss/train': 0.8858946561813354} +11/06/2021 22:17:07 - INFO - __main__ - Step 7411: {'lr': 0.0004983533415595026, 'samples': 1422912, 'steps': 7410, 'loss/train': 2.1833174228668213} +11/06/2021 22:17:08 - INFO - __main__ - Step 7412: {'lr': 0.0004983527334265085, 'samples': 1423104, 'steps': 7411, 'loss/train': 1.8606438636779785} +11/06/2021 22:17:08 - INFO - __main__ - Step 7413: {'lr': 0.0004983521251816105, 'samples': 1423296, 'steps': 7412, 'loss/train': 2.0643343925476074} +11/06/2021 22:17:09 - INFO - __main__ - Step 7414: {'lr': 0.0004983515168248088, 'samples': 1423488, 'steps': 7413, 'loss/train': 2.0445151329040527} +11/06/2021 22:17:09 - INFO - __main__ - Step 7415: {'lr': 0.0004983509083561038, 'samples': 1423680, 'steps': 7414, 'loss/train': 2.069981813430786} +11/06/2021 22:17:09 - INFO - __main__ - Step 7416: {'lr': 0.0004983502997754958, 'samples': 1423872, 'steps': 7415, 'loss/train': 1.200181245803833} +11/06/2021 22:17:11 - INFO - __main__ - Step 7417: {'lr': 0.0004983496910829849, 'samples': 1424064, 'steps': 7416, 'loss/train': 1.8883745670318604} +11/06/2021 22:17:11 - INFO - __main__ - Step 7418: {'lr': 0.0004983490822785715, 'samples': 1424256, 'steps': 7417, 'loss/train': 2.2220919132232666} +11/06/2021 22:17:11 - INFO - __main__ - Step 7419: {'lr': 0.0004983484733622558, 'samples': 1424448, 'steps': 7418, 'loss/train': 1.7355570793151855} +11/06/2021 22:17:12 - INFO - __main__ - Step 7420: {'lr': 0.0004983478643340382, 'samples': 1424640, 'steps': 7419, 'loss/train': 2.0675618648529053} +11/06/2021 22:17:12 - INFO - __main__ - Step 7421: {'lr': 0.0004983472551939186, 'samples': 1424832, 'steps': 7420, 'loss/train': 1.9630166292190552} +11/06/2021 22:17:13 - INFO - __main__ - Step 7422: {'lr': 0.0004983466459418978, 'samples': 1425024, 'steps': 7421, 'loss/train': 2.4349045753479004} +11/06/2021 22:17:13 - INFO - __main__ - Step 7423: {'lr': 0.0004983460365779759, 'samples': 1425216, 'steps': 7422, 'loss/train': 2.1964800357818604} +11/06/2021 22:17:14 - INFO - __main__ - Step 7424: {'lr': 0.0004983454271021529, 'samples': 1425408, 'steps': 7423, 'loss/train': 2.5369303226470947} +11/06/2021 22:17:14 - INFO - __main__ - Step 7425: {'lr': 0.0004983448175144294, 'samples': 1425600, 'steps': 7424, 'loss/train': 2.294490098953247} +11/06/2021 22:17:14 - INFO - __main__ - Step 7426: {'lr': 0.0004983442078148056, 'samples': 1425792, 'steps': 7425, 'loss/train': 1.7043726444244385} +11/06/2021 22:17:15 - INFO - __main__ - Step 7427: {'lr': 0.0004983435980032817, 'samples': 1425984, 'steps': 7426, 'loss/train': 1.0851516723632812} +11/06/2021 22:17:16 - INFO - __main__ - Step 7428: {'lr': 0.0004983429880798579, 'samples': 1426176, 'steps': 7427, 'loss/train': 1.8238978385925293} +11/06/2021 22:17:16 - INFO - __main__ - Step 7429: {'lr': 0.0004983423780445346, 'samples': 1426368, 'steps': 7428, 'loss/train': 2.179898977279663} +11/06/2021 22:17:16 - INFO - __main__ - Step 7430: {'lr': 0.0004983417678973123, 'samples': 1426560, 'steps': 7429, 'loss/train': 2.2200920581817627} +11/06/2021 22:17:17 - INFO - __main__ - Step 7431: {'lr': 0.0004983411576381907, 'samples': 1426752, 'steps': 7430, 'loss/train': 2.471855640411377} +11/06/2021 22:17:18 - INFO - __main__ - Step 7432: {'lr': 0.0004983405472671706, 'samples': 1426944, 'steps': 7431, 'loss/train': 1.9045939445495605} +11/06/2021 22:17:18 - INFO - __main__ - Step 7433: {'lr': 0.000498339936784252, 'samples': 1427136, 'steps': 7432, 'loss/train': 2.156907558441162} +11/06/2021 22:17:18 - INFO - __main__ - Step 7434: {'lr': 0.0004983393261894354, 'samples': 1427328, 'steps': 7433, 'loss/train': 2.357154130935669} +11/06/2021 22:17:19 - INFO - __main__ - Step 7435: {'lr': 0.0004983387154827208, 'samples': 1427520, 'steps': 7434, 'loss/train': 1.69056236743927} +11/06/2021 22:17:19 - INFO - __main__ - Step 7436: {'lr': 0.0004983381046641085, 'samples': 1427712, 'steps': 7435, 'loss/train': 1.9962103366851807} +11/06/2021 22:17:20 - INFO - __main__ - Step 7437: {'lr': 0.0004983374937335991, 'samples': 1427904, 'steps': 7436, 'loss/train': 1.3792200088500977} +11/06/2021 22:17:21 - INFO - __main__ - Step 7438: {'lr': 0.0004983368826911926, 'samples': 1428096, 'steps': 7437, 'loss/train': 1.7087842226028442} +11/06/2021 22:17:21 - INFO - __main__ - Step 7439: {'lr': 0.0004983362715368893, 'samples': 1428288, 'steps': 7438, 'loss/train': 1.5336834192276} +11/06/2021 22:17:21 - INFO - __main__ - Step 7440: {'lr': 0.0004983356602706895, 'samples': 1428480, 'steps': 7439, 'loss/train': 2.1194801330566406} +11/06/2021 22:17:22 - INFO - __main__ - Step 7441: {'lr': 0.0004983350488925936, 'samples': 1428672, 'steps': 7440, 'loss/train': 1.9883663654327393} +11/06/2021 22:17:22 - INFO - __main__ - Step 7442: {'lr': 0.0004983344374026016, 'samples': 1428864, 'steps': 7441, 'loss/train': 1.836441993713379} +11/06/2021 22:17:23 - INFO - __main__ - Step 7443: {'lr': 0.0004983338258007139, 'samples': 1429056, 'steps': 7442, 'loss/train': 1.3787864446640015} +11/06/2021 22:17:24 - INFO - __main__ - Step 7444: {'lr': 0.0004983332140869309, 'samples': 1429248, 'steps': 7443, 'loss/train': 1.911993384361267} +11/06/2021 22:17:24 - INFO - __main__ - Step 7445: {'lr': 0.0004983326022612528, 'samples': 1429440, 'steps': 7444, 'loss/train': 2.0019690990448} +11/06/2021 22:17:24 - INFO - __main__ - Step 7446: {'lr': 0.0004983319903236799, 'samples': 1429632, 'steps': 7445, 'loss/train': 2.305609941482544} +11/06/2021 22:17:25 - INFO - __main__ - Step 7447: {'lr': 0.0004983313782742124, 'samples': 1429824, 'steps': 7446, 'loss/train': 1.3778132200241089} +11/06/2021 22:17:26 - INFO - __main__ - Step 7448: {'lr': 0.0004983307661128505, 'samples': 1430016, 'steps': 7447, 'loss/train': 1.7583122253417969} +11/06/2021 22:17:26 - INFO - __main__ - Step 7449: {'lr': 0.0004983301538395948, 'samples': 1430208, 'steps': 7448, 'loss/train': 1.846149206161499} +11/06/2021 22:17:27 - INFO - __main__ - Step 7450: {'lr': 0.0004983295414544452, 'samples': 1430400, 'steps': 7449, 'loss/train': 1.9692158699035645} +11/06/2021 22:17:27 - INFO - __main__ - Step 7451: {'lr': 0.0004983289289574022, 'samples': 1430592, 'steps': 7450, 'loss/train': 1.7557963132858276} +11/06/2021 22:17:27 - INFO - __main__ - Step 7452: {'lr': 0.000498328316348466, 'samples': 1430784, 'steps': 7451, 'loss/train': 2.0076990127563477} +11/06/2021 22:17:28 - INFO - __main__ - Step 7453: {'lr': 0.0004983277036276369, 'samples': 1430976, 'steps': 7452, 'loss/train': 0.7926499843597412} +11/06/2021 22:17:29 - INFO - __main__ - Step 7454: {'lr': 0.0004983270907949152, 'samples': 1431168, 'steps': 7453, 'loss/train': 1.5046730041503906} +11/06/2021 22:17:29 - INFO - __main__ - Step 7455: {'lr': 0.0004983264778503011, 'samples': 1431360, 'steps': 7454, 'loss/train': 1.3215335607528687} +11/06/2021 22:17:29 - INFO - __main__ - Step 7456: {'lr': 0.0004983258647937949, 'samples': 1431552, 'steps': 7455, 'loss/train': 2.1020658016204834} +11/06/2021 22:17:30 - INFO - __main__ - Step 7457: {'lr': 0.0004983252516253969, 'samples': 1431744, 'steps': 7456, 'loss/train': 1.746657133102417} +11/06/2021 22:17:31 - INFO - __main__ - Step 7458: {'lr': 0.0004983246383451074, 'samples': 1431936, 'steps': 7457, 'loss/train': 2.16377329826355} +11/06/2021 22:17:31 - INFO - __main__ - Step 7459: {'lr': 0.0004983240249529267, 'samples': 1432128, 'steps': 7458, 'loss/train': 2.1467676162719727} +11/06/2021 22:17:31 - INFO - __main__ - Step 7460: {'lr': 0.000498323411448855, 'samples': 1432320, 'steps': 7459, 'loss/train': 1.7520476579666138} +11/06/2021 22:17:32 - INFO - __main__ - Step 7461: {'lr': 0.0004983227978328926, 'samples': 1432512, 'steps': 7460, 'loss/train': 2.5341601371765137} +11/06/2021 22:17:32 - INFO - __main__ - Step 7462: {'lr': 0.0004983221841050397, 'samples': 1432704, 'steps': 7461, 'loss/train': 2.3244829177856445} +11/06/2021 22:17:33 - INFO - __main__ - Step 7463: {'lr': 0.0004983215702652968, 'samples': 1432896, 'steps': 7462, 'loss/train': 1.8480935096740723} +11/06/2021 22:17:34 - INFO - __main__ - Step 7464: {'lr': 0.0004983209563136639, 'samples': 1433088, 'steps': 7463, 'loss/train': 1.939214825630188} +11/06/2021 22:17:34 - INFO - __main__ - Step 7465: {'lr': 0.0004983203422501414, 'samples': 1433280, 'steps': 7464, 'loss/train': 2.0819010734558105} +11/06/2021 22:17:34 - INFO - __main__ - Step 7466: {'lr': 0.0004983197280747297, 'samples': 1433472, 'steps': 7465, 'loss/train': 1.9236360788345337} +11/06/2021 22:17:35 - INFO - __main__ - Step 7467: {'lr': 0.0004983191137874289, 'samples': 1433664, 'steps': 7466, 'loss/train': 1.6283338069915771} +11/06/2021 22:17:35 - INFO - __main__ - Step 7468: {'lr': 0.0004983184993882394, 'samples': 1433856, 'steps': 7467, 'loss/train': 1.6667938232421875} +11/06/2021 22:17:36 - INFO - __main__ - Step 7469: {'lr': 0.0004983178848771613, 'samples': 1434048, 'steps': 7468, 'loss/train': 2.123434066772461} +11/06/2021 22:17:36 - INFO - __main__ - Step 7470: {'lr': 0.0004983172702541951, 'samples': 1434240, 'steps': 7469, 'loss/train': 1.7942487001419067} +11/06/2021 22:17:37 - INFO - __main__ - Step 7471: {'lr': 0.0004983166555193409, 'samples': 1434432, 'steps': 7470, 'loss/train': 2.0577187538146973} +11/06/2021 22:17:37 - INFO - __main__ - Step 7472: {'lr': 0.000498316040672599, 'samples': 1434624, 'steps': 7471, 'loss/train': 1.767512559890747} +11/06/2021 22:17:37 - INFO - __main__ - Step 7473: {'lr': 0.00049831542571397, 'samples': 1434816, 'steps': 7472, 'loss/train': 1.7135177850723267} +11/06/2021 22:17:38 - INFO - __main__ - Step 7474: {'lr': 0.0004983148106434536, 'samples': 1435008, 'steps': 7473, 'loss/train': 1.7563962936401367} +11/06/2021 22:17:39 - INFO - __main__ - Step 7475: {'lr': 0.0004983141954610505, 'samples': 1435200, 'steps': 7474, 'loss/train': 1.7334504127502441} +11/06/2021 22:17:39 - INFO - __main__ - Step 7476: {'lr': 0.0004983135801667608, 'samples': 1435392, 'steps': 7475, 'loss/train': 2.2196826934814453} +11/06/2021 22:17:39 - INFO - __main__ - Step 7477: {'lr': 0.0004983129647605849, 'samples': 1435584, 'steps': 7476, 'loss/train': 1.6023023128509521} +11/06/2021 22:17:40 - INFO - __main__ - Step 7478: {'lr': 0.0004983123492425229, 'samples': 1435776, 'steps': 7477, 'loss/train': 1.4602479934692383} +11/06/2021 22:17:41 - INFO - __main__ - Step 7479: {'lr': 0.0004983117336125753, 'samples': 1435968, 'steps': 7478, 'loss/train': 1.8138916492462158} +11/06/2021 22:17:41 - INFO - __main__ - Step 7480: {'lr': 0.0004983111178707422, 'samples': 1436160, 'steps': 7479, 'loss/train': 1.5433342456817627} +11/06/2021 22:17:41 - INFO - __main__ - Step 7481: {'lr': 0.0004983105020170239, 'samples': 1436352, 'steps': 7480, 'loss/train': 1.7849801778793335} +11/06/2021 22:17:42 - INFO - __main__ - Step 7482: {'lr': 0.0004983098860514209, 'samples': 1436544, 'steps': 7481, 'loss/train': 2.041818380355835} +11/06/2021 22:17:42 - INFO - __main__ - Step 7483: {'lr': 0.0004983092699739331, 'samples': 1436736, 'steps': 7482, 'loss/train': 1.6931136846542358} +11/06/2021 22:17:43 - INFO - __main__ - Step 7484: {'lr': 0.0004983086537845611, 'samples': 1436928, 'steps': 7483, 'loss/train': 1.9418973922729492} +11/06/2021 22:17:44 - INFO - __main__ - Step 7485: {'lr': 0.000498308037483305, 'samples': 1437120, 'steps': 7484, 'loss/train': 1.8237574100494385} +11/06/2021 22:17:44 - INFO - __main__ - Step 7486: {'lr': 0.0004983074210701651, 'samples': 1437312, 'steps': 7485, 'loss/train': 1.779268503189087} +11/06/2021 22:17:44 - INFO - __main__ - Step 7487: {'lr': 0.0004983068045451418, 'samples': 1437504, 'steps': 7486, 'loss/train': 2.059835433959961} +11/06/2021 22:17:45 - INFO - __main__ - Step 7488: {'lr': 0.0004983061879082352, 'samples': 1437696, 'steps': 7487, 'loss/train': 2.341383218765259} +11/06/2021 22:17:46 - INFO - __main__ - Step 7489: {'lr': 0.0004983055711594458, 'samples': 1437888, 'steps': 7488, 'loss/train': 1.6205718517303467} +11/06/2021 22:17:46 - INFO - __main__ - Step 7490: {'lr': 0.0004983049542987736, 'samples': 1438080, 'steps': 7489, 'loss/train': 1.5462263822555542} +11/06/2021 22:17:46 - INFO - __main__ - Step 7491: {'lr': 0.000498304337326219, 'samples': 1438272, 'steps': 7490, 'loss/train': 2.009598970413208} +11/06/2021 22:17:47 - INFO - __main__ - Step 7492: {'lr': 0.0004983037202417824, 'samples': 1438464, 'steps': 7491, 'loss/train': 1.6653988361358643} +11/06/2021 22:17:47 - INFO - __main__ - Step 7493: {'lr': 0.0004983031030454639, 'samples': 1438656, 'steps': 7492, 'loss/train': 1.2993390560150146} +11/06/2021 22:17:48 - INFO - __main__ - Step 7494: {'lr': 0.0004983024857372639, 'samples': 1438848, 'steps': 7493, 'loss/train': 1.8429198265075684} +11/06/2021 22:17:49 - INFO - __main__ - Step 7495: {'lr': 0.0004983018683171826, 'samples': 1439040, 'steps': 7494, 'loss/train': 1.9161350727081299} +11/06/2021 22:17:49 - INFO - __main__ - Step 7496: {'lr': 0.0004983012507852203, 'samples': 1439232, 'steps': 7495, 'loss/train': 1.8230706453323364} +11/06/2021 22:17:49 - INFO - __main__ - Step 7497: {'lr': 0.0004983006331413773, 'samples': 1439424, 'steps': 7496, 'loss/train': 1.6898235082626343} +11/06/2021 22:17:50 - INFO - __main__ - Step 7498: {'lr': 0.0004983000153856539, 'samples': 1439616, 'steps': 7497, 'loss/train': 1.4853415489196777} +11/06/2021 22:17:50 - INFO - __main__ - Step 7499: {'lr': 0.0004982993975180504, 'samples': 1439808, 'steps': 7498, 'loss/train': 2.2079527378082275} +11/06/2021 22:17:51 - INFO - __main__ - Step 7500: {'lr': 0.0004982987795385669, 'samples': 1440000, 'steps': 7499, 'loss/train': 2.117600440979004} +11/06/2021 22:17:51 - INFO - __main__ - Step 7501: {'lr': 0.0004982981614472039, 'samples': 1440192, 'steps': 7500, 'loss/train': 2.0123913288116455} +11/06/2021 22:17:52 - INFO - __main__ - Step 7502: {'lr': 0.0004982975432439615, 'samples': 1440384, 'steps': 7501, 'loss/train': 1.6575013399124146} +11/06/2021 22:17:52 - INFO - __main__ - Step 7503: {'lr': 0.0004982969249288401, 'samples': 1440576, 'steps': 7502, 'loss/train': 0.48864415287971497} +11/06/2021 22:17:53 - INFO - __main__ - Step 7504: {'lr': 0.0004982963065018399, 'samples': 1440768, 'steps': 7503, 'loss/train': 2.1326282024383545} +11/06/2021 22:17:54 - INFO - __main__ - Step 7505: {'lr': 0.0004982956879629612, 'samples': 1440960, 'steps': 7504, 'loss/train': 2.184455633163452} +11/06/2021 22:17:54 - INFO - __main__ - Step 7506: {'lr': 0.0004982950693122044, 'samples': 1441152, 'steps': 7505, 'loss/train': 1.8725202083587646} +11/06/2021 22:17:54 - INFO - __main__ - Step 7507: {'lr': 0.0004982944505495696, 'samples': 1441344, 'steps': 7506, 'loss/train': 1.6214361190795898} +11/06/2021 22:17:55 - INFO - __main__ - Step 7508: {'lr': 0.0004982938316750572, 'samples': 1441536, 'steps': 7507, 'loss/train': 2.0111021995544434} +11/06/2021 22:17:55 - INFO - __main__ - Step 7509: {'lr': 0.0004982932126886674, 'samples': 1441728, 'steps': 7508, 'loss/train': 1.670443058013916} +11/06/2021 22:17:56 - INFO - __main__ - Step 7510: {'lr': 0.0004982925935904004, 'samples': 1441920, 'steps': 7509, 'loss/train': 1.7598836421966553} +11/06/2021 22:17:56 - INFO - __main__ - Step 7511: {'lr': 0.0004982919743802567, 'samples': 1442112, 'steps': 7510, 'loss/train': 2.0992119312286377} +11/06/2021 22:17:57 - INFO - __main__ - Step 7512: {'lr': 0.0004982913550582364, 'samples': 1442304, 'steps': 7511, 'loss/train': 1.790313720703125} +11/06/2021 22:17:57 - INFO - __main__ - Step 7513: {'lr': 0.00049829073562434, 'samples': 1442496, 'steps': 7512, 'loss/train': 1.9669575691223145} +11/06/2021 22:17:57 - INFO - __main__ - Step 7514: {'lr': 0.0004982901160785675, 'samples': 1442688, 'steps': 7513, 'loss/train': 1.6649370193481445} +11/06/2021 22:17:58 - INFO - __main__ - Step 7515: {'lr': 0.0004982894964209193, 'samples': 1442880, 'steps': 7514, 'loss/train': 2.0550930500030518} +11/06/2021 22:17:59 - INFO - __main__ - Step 7516: {'lr': 0.0004982888766513957, 'samples': 1443072, 'steps': 7515, 'loss/train': 1.5787222385406494} +11/06/2021 22:17:59 - INFO - __main__ - Step 7517: {'lr': 0.000498288256769997, 'samples': 1443264, 'steps': 7516, 'loss/train': 1.9650318622589111} +11/06/2021 22:17:59 - INFO - __main__ - Step 7518: {'lr': 0.0004982876367767234, 'samples': 1443456, 'steps': 7517, 'loss/train': 2.108997106552124} +11/06/2021 22:18:00 - INFO - __main__ - Step 7519: {'lr': 0.0004982870166715753, 'samples': 1443648, 'steps': 7518, 'loss/train': 1.5011414289474487} +11/06/2021 22:18:01 - INFO - __main__ - Step 7520: {'lr': 0.0004982863964545529, 'samples': 1443840, 'steps': 7519, 'loss/train': 2.0259969234466553} +11/06/2021 22:18:01 - INFO - __main__ - Step 7521: {'lr': 0.0004982857761256564, 'samples': 1444032, 'steps': 7520, 'loss/train': 2.0949344635009766} +11/06/2021 22:18:01 - INFO - __main__ - Step 7522: {'lr': 0.0004982851556848861, 'samples': 1444224, 'steps': 7521, 'loss/train': 1.771378993988037} +11/06/2021 22:18:02 - INFO - __main__ - Step 7523: {'lr': 0.0004982845351322424, 'samples': 1444416, 'steps': 7522, 'loss/train': 1.6753596067428589} +11/06/2021 22:18:02 - INFO - __main__ - Step 7524: {'lr': 0.0004982839144677257, 'samples': 1444608, 'steps': 7523, 'loss/train': 0.8086962103843689} +11/06/2021 22:18:03 - INFO - __main__ - Step 7525: {'lr': 0.0004982832936913359, 'samples': 1444800, 'steps': 7524, 'loss/train': 1.749570608139038} +11/06/2021 22:18:04 - INFO - __main__ - Step 7526: {'lr': 0.0004982826728030735, 'samples': 1444992, 'steps': 7525, 'loss/train': 1.9992296695709229} +11/06/2021 22:18:04 - INFO - __main__ - Step 7527: {'lr': 0.0004982820518029387, 'samples': 1445184, 'steps': 7526, 'loss/train': 2.0168237686157227} +11/06/2021 22:18:04 - INFO - __main__ - Step 7528: {'lr': 0.000498281430690932, 'samples': 1445376, 'steps': 7527, 'loss/train': 1.9467054605484009} +11/06/2021 22:18:05 - INFO - __main__ - Step 7529: {'lr': 0.0004982808094670534, 'samples': 1445568, 'steps': 7528, 'loss/train': 1.8640716075897217} +11/06/2021 22:18:05 - INFO - __main__ - Step 7530: {'lr': 0.0004982801881313034, 'samples': 1445760, 'steps': 7529, 'loss/train': 1.9027869701385498} +11/06/2021 22:18:06 - INFO - __main__ - Step 7531: {'lr': 0.0004982795666836821, 'samples': 1445952, 'steps': 7530, 'loss/train': 1.8328138589859009} +11/06/2021 22:18:06 - INFO - __main__ - Step 7532: {'lr': 0.00049827894512419, 'samples': 1446144, 'steps': 7531, 'loss/train': 2.27284836769104} +11/06/2021 22:18:07 - INFO - __main__ - Step 7533: {'lr': 0.000498278323452827, 'samples': 1446336, 'steps': 7532, 'loss/train': 1.7987669706344604} +11/06/2021 22:18:07 - INFO - __main__ - Step 7534: {'lr': 0.0004982777016695937, 'samples': 1446528, 'steps': 7533, 'loss/train': 1.1510889530181885} +11/06/2021 22:18:08 - INFO - __main__ - Step 7535: {'lr': 0.0004982770797744904, 'samples': 1446720, 'steps': 7534, 'loss/train': 1.9908004999160767} +11/06/2021 22:18:09 - INFO - __main__ - Step 7536: {'lr': 0.0004982764577675172, 'samples': 1446912, 'steps': 7535, 'loss/train': 2.135575532913208} +11/06/2021 22:18:09 - INFO - __main__ - Step 7537: {'lr': 0.0004982758356486746, 'samples': 1447104, 'steps': 7536, 'loss/train': 1.4963163137435913} +11/06/2021 22:18:09 - INFO - __main__ - Step 7538: {'lr': 0.0004982752134179624, 'samples': 1447296, 'steps': 7537, 'loss/train': 2.040847063064575} +11/06/2021 22:18:10 - INFO - __main__ - Step 7539: {'lr': 0.0004982745910753815, 'samples': 1447488, 'steps': 7538, 'loss/train': 2.0529308319091797} +11/06/2021 22:18:10 - INFO - __main__ - Step 7540: {'lr': 0.0004982739686209319, 'samples': 1447680, 'steps': 7539, 'loss/train': 1.5102424621582031} +11/06/2021 22:18:10 - INFO - __main__ - Step 7541: {'lr': 0.0004982733460546138, 'samples': 1447872, 'steps': 7540, 'loss/train': 2.3759987354278564} +11/06/2021 22:18:11 - INFO - __main__ - Step 7542: {'lr': 0.0004982727233764276, 'samples': 1448064, 'steps': 7541, 'loss/train': 1.264660120010376} +11/06/2021 22:18:12 - INFO - __main__ - Step 7543: {'lr': 0.0004982721005863734, 'samples': 1448256, 'steps': 7542, 'loss/train': 2.076897621154785} +11/06/2021 22:18:12 - INFO - __main__ - Step 7544: {'lr': 0.0004982714776844518, 'samples': 1448448, 'steps': 7543, 'loss/train': 1.9812895059585571} +11/06/2021 22:18:13 - INFO - __main__ - Step 7545: {'lr': 0.0004982708546706628, 'samples': 1448640, 'steps': 7544, 'loss/train': 1.7536218166351318} +11/06/2021 22:18:13 - INFO - __main__ - Step 7546: {'lr': 0.0004982702315450068, 'samples': 1448832, 'steps': 7545, 'loss/train': 2.1761927604675293} +11/06/2021 22:18:14 - INFO - __main__ - Step 7547: {'lr': 0.0004982696083074841, 'samples': 1449024, 'steps': 7546, 'loss/train': 1.766358494758606} +11/06/2021 22:18:14 - INFO - __main__ - Step 7548: {'lr': 0.0004982689849580951, 'samples': 1449216, 'steps': 7547, 'loss/train': 0.7626532912254333} +11/06/2021 22:18:15 - INFO - __main__ - Step 7549: {'lr': 0.0004982683614968396, 'samples': 1449408, 'steps': 7548, 'loss/train': 1.5238088369369507} +11/06/2021 22:18:15 - INFO - __main__ - Step 7550: {'lr': 0.0004982677379237185, 'samples': 1449600, 'steps': 7549, 'loss/train': 1.834945797920227} +11/06/2021 22:18:15 - INFO - __main__ - Step 7551: {'lr': 0.0004982671142387316, 'samples': 1449792, 'steps': 7550, 'loss/train': 1.1642390489578247} +11/06/2021 22:18:17 - INFO - __main__ - Step 7552: {'lr': 0.0004982664904418794, 'samples': 1449984, 'steps': 7551, 'loss/train': 0.791139543056488} +11/06/2021 22:18:17 - INFO - __main__ - Step 7553: {'lr': 0.0004982658665331622, 'samples': 1450176, 'steps': 7552, 'loss/train': 2.0422914028167725} +11/06/2021 22:18:17 - INFO - __main__ - Step 7554: {'lr': 0.0004982652425125802, 'samples': 1450368, 'steps': 7553, 'loss/train': 2.1857669353485107} +11/06/2021 22:18:18 - INFO - __main__ - Step 7555: {'lr': 0.0004982646183801337, 'samples': 1450560, 'steps': 7554, 'loss/train': 2.560479164123535} +11/06/2021 22:18:18 - INFO - __main__ - Step 7556: {'lr': 0.000498263994135823, 'samples': 1450752, 'steps': 7555, 'loss/train': 2.5498902797698975} +11/06/2021 22:18:18 - INFO - __main__ - Step 7557: {'lr': 0.0004982633697796484, 'samples': 1450944, 'steps': 7556, 'loss/train': 2.1660470962524414} +11/06/2021 22:18:19 - INFO - __main__ - Step 7558: {'lr': 0.0004982627453116102, 'samples': 1451136, 'steps': 7557, 'loss/train': 1.7757936716079712} +11/06/2021 22:18:20 - INFO - __main__ - Step 7559: {'lr': 0.0004982621207317086, 'samples': 1451328, 'steps': 7558, 'loss/train': 1.7856800556182861} +11/06/2021 22:18:20 - INFO - __main__ - Step 7560: {'lr': 0.0004982614960399439, 'samples': 1451520, 'steps': 7559, 'loss/train': 1.483529806137085} +11/06/2021 22:18:20 - INFO - __main__ - Step 7561: {'lr': 0.0004982608712363163, 'samples': 1451712, 'steps': 7560, 'loss/train': 2.1394612789154053} +11/06/2021 22:18:21 - INFO - __main__ - Step 7562: {'lr': 0.0004982602463208263, 'samples': 1451904, 'steps': 7561, 'loss/train': 2.436344861984253} +11/06/2021 22:18:22 - INFO - __main__ - Step 7563: {'lr': 0.0004982596212934742, 'samples': 1452096, 'steps': 7562, 'loss/train': 2.3320164680480957} +11/06/2021 22:18:22 - INFO - __main__ - Step 7564: {'lr': 0.00049825899615426, 'samples': 1452288, 'steps': 7563, 'loss/train': 1.0937427282333374} +11/06/2021 22:18:22 - INFO - __main__ - Step 7565: {'lr': 0.000498258370903184, 'samples': 1452480, 'steps': 7564, 'loss/train': 1.8388676643371582} +11/06/2021 22:18:23 - INFO - __main__ - Step 7566: {'lr': 0.0004982577455402467, 'samples': 1452672, 'steps': 7565, 'loss/train': 1.7357767820358276} +11/06/2021 22:18:23 - INFO - __main__ - Step 7567: {'lr': 0.0004982571200654485, 'samples': 1452864, 'steps': 7566, 'loss/train': 1.5761942863464355} +11/06/2021 22:18:24 - INFO - __main__ - Step 7568: {'lr': 0.0004982564944787892, 'samples': 1453056, 'steps': 7567, 'loss/train': 2.1120853424072266} +11/06/2021 22:18:25 - INFO - __main__ - Step 7569: {'lr': 0.0004982558687802695, 'samples': 1453248, 'steps': 7568, 'loss/train': 2.013747453689575} +11/06/2021 22:18:25 - INFO - __main__ - Step 7570: {'lr': 0.0004982552429698894, 'samples': 1453440, 'steps': 7569, 'loss/train': 2.029210090637207} +11/06/2021 22:18:25 - INFO - __main__ - Step 7571: {'lr': 0.0004982546170476494, 'samples': 1453632, 'steps': 7570, 'loss/train': 1.5686355829238892} +11/06/2021 22:18:26 - INFO - __main__ - Step 7572: {'lr': 0.0004982539910135497, 'samples': 1453824, 'steps': 7571, 'loss/train': 1.8889784812927246} +11/06/2021 22:18:27 - INFO - __main__ - Step 7573: {'lr': 0.0004982533648675906, 'samples': 1454016, 'steps': 7572, 'loss/train': 2.56605863571167} +11/06/2021 22:18:27 - INFO - __main__ - Step 7574: {'lr': 0.0004982527386097723, 'samples': 1454208, 'steps': 7573, 'loss/train': 1.9748719930648804} +11/06/2021 22:18:27 - INFO - __main__ - Step 7575: {'lr': 0.0004982521122400953, 'samples': 1454400, 'steps': 7574, 'loss/train': 1.4213409423828125} +11/06/2021 22:18:28 - INFO - __main__ - Step 7576: {'lr': 0.0004982514857585596, 'samples': 1454592, 'steps': 7575, 'loss/train': 1.8690491914749146} +11/06/2021 22:18:28 - INFO - __main__ - Step 7577: {'lr': 0.0004982508591651657, 'samples': 1454784, 'steps': 7576, 'loss/train': 2.0668842792510986} +11/06/2021 22:18:29 - INFO - __main__ - Step 7578: {'lr': 0.0004982502324599137, 'samples': 1454976, 'steps': 7577, 'loss/train': 2.21287202835083} +11/06/2021 22:18:29 - INFO - __main__ - Step 7579: {'lr': 0.000498249605642804, 'samples': 1455168, 'steps': 7578, 'loss/train': 1.7789140939712524} +11/06/2021 22:18:30 - INFO - __main__ - Step 7580: {'lr': 0.0004982489787138369, 'samples': 1455360, 'steps': 7579, 'loss/train': 1.9952287673950195} +11/06/2021 22:18:30 - INFO - __main__ - Step 7581: {'lr': 0.0004982483516730126, 'samples': 1455552, 'steps': 7580, 'loss/train': 1.8334144353866577} +11/06/2021 22:18:30 - INFO - __main__ - Step 7582: {'lr': 0.0004982477245203314, 'samples': 1455744, 'steps': 7581, 'loss/train': 1.755232572555542} +11/06/2021 22:18:31 - INFO - __main__ - Step 7583: {'lr': 0.0004982470972557936, 'samples': 1455936, 'steps': 7582, 'loss/train': 2.4827017784118652} +11/06/2021 22:18:32 - INFO - __main__ - Step 7584: {'lr': 0.0004982464698793995, 'samples': 1456128, 'steps': 7583, 'loss/train': 1.831977128982544} +11/06/2021 22:18:32 - INFO - __main__ - Step 7585: {'lr': 0.0004982458423911495, 'samples': 1456320, 'steps': 7584, 'loss/train': 2.0919387340545654} +11/06/2021 22:18:32 - INFO - __main__ - Step 7586: {'lr': 0.0004982452147910437, 'samples': 1456512, 'steps': 7585, 'loss/train': 2.820591449737549} +11/06/2021 22:18:33 - INFO - __main__ - Step 7587: {'lr': 0.0004982445870790823, 'samples': 1456704, 'steps': 7586, 'loss/train': 1.7887145280838013} +11/06/2021 22:18:34 - INFO - __main__ - Step 7588: {'lr': 0.0004982439592552658, 'samples': 1456896, 'steps': 7587, 'loss/train': 1.2820543050765991} +11/06/2021 22:18:35 - INFO - __main__ - Step 7589: {'lr': 0.0004982433313195945, 'samples': 1457088, 'steps': 7588, 'loss/train': 2.508904218673706} +11/06/2021 22:18:35 - INFO - __main__ - Step 7590: {'lr': 0.0004982427032720685, 'samples': 1457280, 'steps': 7589, 'loss/train': 1.968804121017456} +11/06/2021 22:18:35 - INFO - __main__ - Step 7591: {'lr': 0.0004982420751126882, 'samples': 1457472, 'steps': 7590, 'loss/train': 2.2515952587127686} +11/06/2021 22:18:36 - INFO - __main__ - Step 7592: {'lr': 0.0004982414468414538, 'samples': 1457664, 'steps': 7591, 'loss/train': 2.3000688552856445} +11/06/2021 22:18:36 - INFO - __main__ - Step 7593: {'lr': 0.0004982408184583656, 'samples': 1457856, 'steps': 7592, 'loss/train': 1.6771053075790405} +11/06/2021 22:18:37 - INFO - __main__ - Step 7594: {'lr': 0.000498240189963424, 'samples': 1458048, 'steps': 7593, 'loss/train': 1.5368093252182007} +11/06/2021 22:18:37 - INFO - __main__ - Step 7595: {'lr': 0.0004982395613566291, 'samples': 1458240, 'steps': 7594, 'loss/train': 2.213350772857666} +11/06/2021 22:18:38 - INFO - __main__ - Step 7596: {'lr': 0.0004982389326379814, 'samples': 1458432, 'steps': 7595, 'loss/train': 1.887166142463684} +11/06/2021 22:18:38 - INFO - __main__ - Step 7597: {'lr': 0.000498238303807481, 'samples': 1458624, 'steps': 7596, 'loss/train': 2.0999624729156494} +11/06/2021 22:18:38 - INFO - __main__ - Step 7598: {'lr': 0.0004982376748651283, 'samples': 1458816, 'steps': 7597, 'loss/train': 1.3151088953018188} +11/06/2021 22:18:39 - INFO - __main__ - Step 7599: {'lr': 0.0004982370458109235, 'samples': 1459008, 'steps': 7598, 'loss/train': 1.5262982845306396} +11/06/2021 22:18:40 - INFO - __main__ - Step 7600: {'lr': 0.0004982364166448669, 'samples': 1459200, 'steps': 7599, 'loss/train': 1.9225597381591797} +11/06/2021 22:18:40 - INFO - __main__ - Step 7601: {'lr': 0.0004982357873669588, 'samples': 1459392, 'steps': 7600, 'loss/train': 1.6969056129455566} +11/06/2021 22:18:40 - INFO - __main__ - Step 7602: {'lr': 0.0004982351579771995, 'samples': 1459584, 'steps': 7601, 'loss/train': 1.8867172002792358} +11/06/2021 22:18:41 - INFO - __main__ - Step 7603: {'lr': 0.0004982345284755893, 'samples': 1459776, 'steps': 7602, 'loss/train': 2.111384868621826} +11/06/2021 22:18:41 - INFO - __main__ - Step 7604: {'lr': 0.0004982338988621284, 'samples': 1459968, 'steps': 7603, 'loss/train': 1.420168161392212} +11/06/2021 22:18:42 - INFO - __main__ - Step 7605: {'lr': 0.0004982332691368172, 'samples': 1460160, 'steps': 7604, 'loss/train': 2.9915659427642822} +11/06/2021 22:18:43 - INFO - __main__ - Step 7606: {'lr': 0.0004982326392996559, 'samples': 1460352, 'steps': 7605, 'loss/train': 1.3998850584030151} +11/06/2021 22:18:43 - INFO - __main__ - Step 7607: {'lr': 0.0004982320093506449, 'samples': 1460544, 'steps': 7606, 'loss/train': 1.5841953754425049} +11/06/2021 22:18:43 - INFO - __main__ - Step 7608: {'lr': 0.0004982313792897843, 'samples': 1460736, 'steps': 7607, 'loss/train': 1.2424761056900024} +11/06/2021 22:18:44 - INFO - __main__ - Step 7609: {'lr': 0.0004982307491170744, 'samples': 1460928, 'steps': 7608, 'loss/train': 2.063056707382202} +11/06/2021 22:18:45 - INFO - __main__ - Step 7610: {'lr': 0.0004982301188325156, 'samples': 1461120, 'steps': 7609, 'loss/train': 1.6519533395767212} +11/06/2021 22:18:45 - INFO - __main__ - Step 7611: {'lr': 0.0004982294884361081, 'samples': 1461312, 'steps': 7610, 'loss/train': 1.2619507312774658} +11/06/2021 22:18:45 - INFO - __main__ - Step 7612: {'lr': 0.0004982288579278522, 'samples': 1461504, 'steps': 7611, 'loss/train': 1.7545194625854492} +11/06/2021 22:18:46 - INFO - __main__ - Step 7613: {'lr': 0.0004982282273077483, 'samples': 1461696, 'steps': 7612, 'loss/train': 1.8897991180419922} +11/06/2021 22:18:46 - INFO - __main__ - Step 7614: {'lr': 0.0004982275965757965, 'samples': 1461888, 'steps': 7613, 'loss/train': 1.383413314819336} +11/06/2021 22:18:47 - INFO - __main__ - Step 7615: {'lr': 0.0004982269657319974, 'samples': 1462080, 'steps': 7614, 'loss/train': 1.955425500869751} +11/06/2021 22:18:47 - INFO - __main__ - Step 7616: {'lr': 0.0004982263347763508, 'samples': 1462272, 'steps': 7615, 'loss/train': 1.6622871160507202} +11/06/2021 22:18:48 - INFO - __main__ - Step 7617: {'lr': 0.0004982257037088574, 'samples': 1462464, 'steps': 7616, 'loss/train': 1.82854425907135} +11/06/2021 22:18:48 - INFO - __main__ - Step 7618: {'lr': 0.0004982250725295173, 'samples': 1462656, 'steps': 7617, 'loss/train': 2.0947282314300537} +11/06/2021 22:18:48 - INFO - __main__ - Step 7619: {'lr': 0.0004982244412383307, 'samples': 1462848, 'steps': 7618, 'loss/train': 1.5993701219558716} +11/06/2021 22:18:49 - INFO - __main__ - Step 7620: {'lr': 0.0004982238098352981, 'samples': 1463040, 'steps': 7619, 'loss/train': 2.0519866943359375} +11/06/2021 22:18:50 - INFO - __main__ - Step 7621: {'lr': 0.0004982231783204196, 'samples': 1463232, 'steps': 7620, 'loss/train': 1.768385887145996} +11/06/2021 22:18:50 - INFO - __main__ - Step 7622: {'lr': 0.0004982225466936957, 'samples': 1463424, 'steps': 7621, 'loss/train': 2.114351749420166} +11/06/2021 22:18:51 - INFO - __main__ - Step 7623: {'lr': 0.0004982219149551265, 'samples': 1463616, 'steps': 7622, 'loss/train': 2.196870803833008} +11/06/2021 22:18:51 - INFO - __main__ - Step 7624: {'lr': 0.0004982212831047123, 'samples': 1463808, 'steps': 7623, 'loss/train': 2.04628586769104} +11/06/2021 22:18:51 - INFO - __main__ - Step 7625: {'lr': 0.0004982206511424534, 'samples': 1464000, 'steps': 7624, 'loss/train': 1.2371141910552979} +11/06/2021 22:18:52 - INFO - __main__ - Step 7626: {'lr': 0.0004982200190683502, 'samples': 1464192, 'steps': 7625, 'loss/train': 1.4562172889709473} +11/06/2021 22:18:53 - INFO - __main__ - Step 7627: {'lr': 0.0004982193868824028, 'samples': 1464384, 'steps': 7626, 'loss/train': 1.9983298778533936} +11/06/2021 22:18:53 - INFO - __main__ - Step 7628: {'lr': 0.0004982187545846116, 'samples': 1464576, 'steps': 7627, 'loss/train': 2.135972261428833} +11/06/2021 22:18:53 - INFO - __main__ - Step 7629: {'lr': 0.0004982181221749769, 'samples': 1464768, 'steps': 7628, 'loss/train': 2.405860424041748} +11/06/2021 22:18:54 - INFO - __main__ - Step 7630: {'lr': 0.0004982174896534989, 'samples': 1464960, 'steps': 7629, 'loss/train': 1.3668652772903442} +11/06/2021 22:18:55 - INFO - __main__ - Step 7631: {'lr': 0.0004982168570201779, 'samples': 1465152, 'steps': 7630, 'loss/train': 1.261794924736023} +11/06/2021 22:18:55 - INFO - __main__ - Step 7632: {'lr': 0.0004982162242750143, 'samples': 1465344, 'steps': 7631, 'loss/train': 1.8205006122589111} +11/06/2021 22:18:55 - INFO - __main__ - Step 7633: {'lr': 0.0004982155914180082, 'samples': 1465536, 'steps': 7632, 'loss/train': 1.8356959819793701} +11/06/2021 22:18:56 - INFO - __main__ - Step 7634: {'lr': 0.0004982149584491601, 'samples': 1465728, 'steps': 7633, 'loss/train': 2.227440357208252} +11/06/2021 22:18:56 - INFO - __main__ - Step 7635: {'lr': 0.0004982143253684701, 'samples': 1465920, 'steps': 7634, 'loss/train': 1.8960446119308472} +11/06/2021 22:18:57 - INFO - __main__ - Step 7636: {'lr': 0.0004982136921759385, 'samples': 1466112, 'steps': 7635, 'loss/train': 1.77176833152771} +11/06/2021 22:18:57 - INFO - __main__ - Step 7637: {'lr': 0.0004982130588715657, 'samples': 1466304, 'steps': 7636, 'loss/train': 1.8046529293060303} +11/06/2021 22:18:58 - INFO - __main__ - Step 7638: {'lr': 0.000498212425455352, 'samples': 1466496, 'steps': 7637, 'loss/train': 1.6778465509414673} +11/06/2021 22:18:58 - INFO - __main__ - Step 7639: {'lr': 0.0004982117919272975, 'samples': 1466688, 'steps': 7638, 'loss/train': 1.662865400314331} +11/06/2021 22:18:59 - INFO - __main__ - Step 7640: {'lr': 0.0004982111582874026, 'samples': 1466880, 'steps': 7639, 'loss/train': 1.8962922096252441} +11/06/2021 22:18:59 - INFO - __main__ - Step 7641: {'lr': 0.0004982105245356676, 'samples': 1467072, 'steps': 7640, 'loss/train': 1.8994383811950684} +11/06/2021 22:19:00 - INFO - __main__ - Step 7642: {'lr': 0.0004982098906720928, 'samples': 1467264, 'steps': 7641, 'loss/train': 1.8286490440368652} +11/06/2021 22:19:00 - INFO - __main__ - Step 7643: {'lr': 0.0004982092566966785, 'samples': 1467456, 'steps': 7642, 'loss/train': 1.5329943895339966} +11/06/2021 22:19:01 - INFO - __main__ - Step 7644: {'lr': 0.0004982086226094248, 'samples': 1467648, 'steps': 7643, 'loss/train': 2.1548547744750977} +11/06/2021 22:19:01 - INFO - __main__ - Step 7645: {'lr': 0.0004982079884103322, 'samples': 1467840, 'steps': 7644, 'loss/train': 2.1634531021118164} +11/06/2021 22:19:02 - INFO - __main__ - Step 7646: {'lr': 0.0004982073540994009, 'samples': 1468032, 'steps': 7645, 'loss/train': 2.008009195327759} +11/06/2021 22:19:02 - INFO - __main__ - Step 7647: {'lr': 0.0004982067196766312, 'samples': 1468224, 'steps': 7646, 'loss/train': 1.8204351663589478} +11/06/2021 22:19:03 - INFO - __main__ - Step 7648: {'lr': 0.0004982060851420235, 'samples': 1468416, 'steps': 7647, 'loss/train': 2.1249916553497314} +11/06/2021 22:19:03 - INFO - __main__ - Step 7649: {'lr': 0.0004982054504955778, 'samples': 1468608, 'steps': 7648, 'loss/train': 1.6242306232452393} +11/06/2021 22:19:03 - INFO - __main__ - Step 7650: {'lr': 0.0004982048157372946, 'samples': 1468800, 'steps': 7649, 'loss/train': 1.693130612373352} +11/06/2021 22:19:04 - INFO - __main__ - Step 7651: {'lr': 0.0004982041808671741, 'samples': 1468992, 'steps': 7650, 'loss/train': 2.0973668098449707} +11/06/2021 22:19:05 - INFO - __main__ - Step 7652: {'lr': 0.0004982035458852168, 'samples': 1469184, 'steps': 7651, 'loss/train': 2.164299488067627} +11/06/2021 22:19:05 - INFO - __main__ - Step 7653: {'lr': 0.0004982029107914226, 'samples': 1469376, 'steps': 7652, 'loss/train': 2.062432289123535} +11/06/2021 22:19:05 - INFO - __main__ - Step 7654: {'lr': 0.0004982022755857921, 'samples': 1469568, 'steps': 7653, 'loss/train': 2.0671913623809814} +11/06/2021 22:19:06 - INFO - __main__ - Step 7655: {'lr': 0.0004982016402683255, 'samples': 1469760, 'steps': 7654, 'loss/train': 2.361668348312378} +11/06/2021 22:19:06 - INFO - __main__ - Step 7656: {'lr': 0.000498201004839023, 'samples': 1469952, 'steps': 7655, 'loss/train': 1.3417774438858032} +11/06/2021 22:19:07 - INFO - __main__ - Step 7657: {'lr': 0.000498200369297885, 'samples': 1470144, 'steps': 7656, 'loss/train': 1.8992770910263062} +11/06/2021 22:19:08 - INFO - __main__ - Step 7658: {'lr': 0.0004981997336449118, 'samples': 1470336, 'steps': 7657, 'loss/train': 1.9563990831375122} +11/06/2021 22:19:08 - INFO - __main__ - Step 7659: {'lr': 0.0004981990978801035, 'samples': 1470528, 'steps': 7658, 'loss/train': 2.046013593673706} +11/06/2021 22:19:08 - INFO - __main__ - Step 7660: {'lr': 0.0004981984620034606, 'samples': 1470720, 'steps': 7659, 'loss/train': 1.6640254259109497} +11/06/2021 22:19:09 - INFO - __main__ - Step 7661: {'lr': 0.0004981978260149833, 'samples': 1470912, 'steps': 7660, 'loss/train': 1.9074742794036865} +11/06/2021 22:19:10 - INFO - __main__ - Step 7662: {'lr': 0.0004981971899146719, 'samples': 1471104, 'steps': 7661, 'loss/train': 2.0889925956726074} +11/06/2021 22:19:10 - INFO - __main__ - Step 7663: {'lr': 0.0004981965537025267, 'samples': 1471296, 'steps': 7662, 'loss/train': 2.0140273571014404} +11/06/2021 22:19:10 - INFO - __main__ - Step 7664: {'lr': 0.000498195917378548, 'samples': 1471488, 'steps': 7663, 'loss/train': 1.5945501327514648} +11/06/2021 22:19:11 - INFO - __main__ - Step 7665: {'lr': 0.0004981952809427359, 'samples': 1471680, 'steps': 7664, 'loss/train': 1.7172966003417969} +11/06/2021 22:19:11 - INFO - __main__ - Step 7666: {'lr': 0.0004981946443950909, 'samples': 1471872, 'steps': 7665, 'loss/train': 1.3649691343307495} +11/06/2021 22:19:12 - INFO - __main__ - Step 7667: {'lr': 0.0004981940077356132, 'samples': 1472064, 'steps': 7666, 'loss/train': 0.8751164674758911} +11/06/2021 22:19:12 - INFO - __main__ - Step 7668: {'lr': 0.0004981933709643032, 'samples': 1472256, 'steps': 7667, 'loss/train': 1.916032314300537} +11/06/2021 22:19:13 - INFO - __main__ - Step 7669: {'lr': 0.000498192734081161, 'samples': 1472448, 'steps': 7668, 'loss/train': 1.9548919200897217} +11/06/2021 22:19:13 - INFO - __main__ - Step 7670: {'lr': 0.000498192097086187, 'samples': 1472640, 'steps': 7669, 'loss/train': 1.8466298580169678} +11/06/2021 22:19:13 - INFO - __main__ - Step 7671: {'lr': 0.0004981914599793816, 'samples': 1472832, 'steps': 7670, 'loss/train': 3.0567245483398438} +11/06/2021 22:19:14 - INFO - __main__ - Step 7672: {'lr': 0.0004981908227607448, 'samples': 1473024, 'steps': 7671, 'loss/train': 1.7764103412628174} +11/06/2021 22:19:15 - INFO - __main__ - Step 7673: {'lr': 0.0004981901854302771, 'samples': 1473216, 'steps': 7672, 'loss/train': 2.425710678100586} +11/06/2021 22:19:15 - INFO - __main__ - Step 7674: {'lr': 0.0004981895479879787, 'samples': 1473408, 'steps': 7673, 'loss/train': 1.5297969579696655} +11/06/2021 22:19:15 - INFO - __main__ - Step 7675: {'lr': 0.0004981889104338499, 'samples': 1473600, 'steps': 7674, 'loss/train': 1.673049807548523} +11/06/2021 22:19:16 - INFO - __main__ - Step 7676: {'lr': 0.0004981882727678912, 'samples': 1473792, 'steps': 7675, 'loss/train': 1.8792694807052612} +11/06/2021 22:19:17 - INFO - __main__ - Step 7677: {'lr': 0.0004981876349901025, 'samples': 1473984, 'steps': 7676, 'loss/train': 1.6450796127319336} +11/06/2021 22:19:17 - INFO - __main__ - Step 7678: {'lr': 0.0004981869971004843, 'samples': 1474176, 'steps': 7677, 'loss/train': 1.8612487316131592} +11/06/2021 22:19:18 - INFO - __main__ - Step 7679: {'lr': 0.0004981863590990369, 'samples': 1474368, 'steps': 7678, 'loss/train': 1.9628400802612305} +11/06/2021 22:19:18 - INFO - __main__ - Step 7680: {'lr': 0.0004981857209857605, 'samples': 1474560, 'steps': 7679, 'loss/train': 2.1773593425750732} +11/06/2021 22:19:18 - INFO - __main__ - Step 7681: {'lr': 0.0004981850827606556, 'samples': 1474752, 'steps': 7680, 'loss/train': 2.009646415710449} +11/06/2021 22:19:19 - INFO - __main__ - Step 7682: {'lr': 0.0004981844444237223, 'samples': 1474944, 'steps': 7681, 'loss/train': 1.6620737314224243} +11/06/2021 22:19:20 - INFO - __main__ - Step 7683: {'lr': 0.0004981838059749607, 'samples': 1475136, 'steps': 7682, 'loss/train': 1.8136749267578125} +11/06/2021 22:19:20 - INFO - __main__ - Step 7684: {'lr': 0.0004981831674143716, 'samples': 1475328, 'steps': 7683, 'loss/train': 2.1339547634124756} +11/06/2021 22:19:20 - INFO - __main__ - Step 7685: {'lr': 0.0004981825287419549, 'samples': 1475520, 'steps': 7684, 'loss/train': 1.375860571861267} +11/06/2021 22:19:21 - INFO - __main__ - Step 7686: {'lr': 0.0004981818899577108, 'samples': 1475712, 'steps': 7685, 'loss/train': 1.8953708410263062} +11/06/2021 22:19:21 - INFO - __main__ - Step 7687: {'lr': 0.0004981812510616399, 'samples': 1475904, 'steps': 7686, 'loss/train': 1.9942034482955933} +11/06/2021 22:19:22 - INFO - __main__ - Step 7688: {'lr': 0.0004981806120537424, 'samples': 1476096, 'steps': 7687, 'loss/train': 1.7413487434387207} +11/06/2021 22:19:22 - INFO - __main__ - Step 7689: {'lr': 0.0004981799729340185, 'samples': 1476288, 'steps': 7688, 'loss/train': 1.861914038658142} +11/06/2021 22:19:23 - INFO - __main__ - Step 7690: {'lr': 0.0004981793337024685, 'samples': 1476480, 'steps': 7689, 'loss/train': 1.644492745399475} +11/06/2021 22:19:23 - INFO - __main__ - Step 7691: {'lr': 0.0004981786943590928, 'samples': 1476672, 'steps': 7690, 'loss/train': 1.96816885471344} +11/06/2021 22:19:24 - INFO - __main__ - Step 7692: {'lr': 0.0004981780549038916, 'samples': 1476864, 'steps': 7691, 'loss/train': 1.6738519668579102} +11/06/2021 22:19:25 - INFO - __main__ - Step 7693: {'lr': 0.0004981774153368651, 'samples': 1477056, 'steps': 7692, 'loss/train': 1.7269313335418701} +11/06/2021 22:19:25 - INFO - __main__ - Step 7694: {'lr': 0.0004981767756580138, 'samples': 1477248, 'steps': 7693, 'loss/train': 1.7965588569641113} +11/06/2021 22:19:25 - INFO - __main__ - Step 7695: {'lr': 0.0004981761358673378, 'samples': 1477440, 'steps': 7694, 'loss/train': 2.0630042552948} +11/06/2021 22:19:26 - INFO - __main__ - Step 7696: {'lr': 0.0004981754959648376, 'samples': 1477632, 'steps': 7695, 'loss/train': 1.89278244972229} +11/06/2021 22:19:26 - INFO - __main__ - Step 7697: {'lr': 0.0004981748559505131, 'samples': 1477824, 'steps': 7696, 'loss/train': 1.7540265321731567} +11/06/2021 22:19:27 - INFO - __main__ - Step 7698: {'lr': 0.0004981742158243651, 'samples': 1478016, 'steps': 7697, 'loss/train': 1.4253634214401245} +11/06/2021 22:19:27 - INFO - __main__ - Step 7699: {'lr': 0.0004981735755863934, 'samples': 1478208, 'steps': 7698, 'loss/train': 2.059159517288208} +11/06/2021 22:19:28 - INFO - __main__ - Step 7700: {'lr': 0.0004981729352365986, 'samples': 1478400, 'steps': 7699, 'loss/train': 1.953817367553711} +11/06/2021 22:19:28 - INFO - __main__ - Step 7701: {'lr': 0.0004981722947749811, 'samples': 1478592, 'steps': 7700, 'loss/train': 1.9342195987701416} +11/06/2021 22:19:28 - INFO - __main__ - Step 7702: {'lr': 0.0004981716542015408, 'samples': 1478784, 'steps': 7701, 'loss/train': 1.841950535774231} +11/06/2021 22:19:29 - INFO - __main__ - Step 7703: {'lr': 0.0004981710135162781, 'samples': 1478976, 'steps': 7702, 'loss/train': 1.5683513879776} +11/06/2021 22:19:30 - INFO - __main__ - Step 7704: {'lr': 0.0004981703727191935, 'samples': 1479168, 'steps': 7703, 'loss/train': 1.7264535427093506} +11/06/2021 22:19:30 - INFO - __main__ - Step 7705: {'lr': 0.0004981697318102872, 'samples': 1479360, 'steps': 7704, 'loss/train': 2.026911973953247} +11/06/2021 22:19:31 - INFO - __main__ - Step 7706: {'lr': 0.0004981690907895594, 'samples': 1479552, 'steps': 7705, 'loss/train': 1.9870184659957886} +11/06/2021 22:19:31 - INFO - __main__ - Step 7707: {'lr': 0.0004981684496570104, 'samples': 1479744, 'steps': 7706, 'loss/train': 1.9878273010253906} +11/06/2021 22:19:31 - INFO - __main__ - Step 7708: {'lr': 0.0004981678084126405, 'samples': 1479936, 'steps': 7707, 'loss/train': 1.5540006160736084} +11/06/2021 22:19:32 - INFO - __main__ - Step 7709: {'lr': 0.0004981671670564502, 'samples': 1480128, 'steps': 7708, 'loss/train': 1.544403314590454} +11/06/2021 22:19:33 - INFO - __main__ - Step 7710: {'lr': 0.0004981665255884394, 'samples': 1480320, 'steps': 7709, 'loss/train': 2.273404598236084} +11/06/2021 22:19:33 - INFO - __main__ - Step 7711: {'lr': 0.0004981658840086087, 'samples': 1480512, 'steps': 7710, 'loss/train': 2.1462695598602295} +11/06/2021 22:19:33 - INFO - __main__ - Step 7712: {'lr': 0.0004981652423169582, 'samples': 1480704, 'steps': 7711, 'loss/train': 1.3098105192184448} +11/06/2021 22:19:34 - INFO - __main__ - Step 7713: {'lr': 0.0004981646005134884, 'samples': 1480896, 'steps': 7712, 'loss/train': 1.9249402284622192} +11/06/2021 22:19:35 - INFO - __main__ - Step 7714: {'lr': 0.0004981639585981993, 'samples': 1481088, 'steps': 7713, 'loss/train': 1.955265760421753} +11/06/2021 22:19:35 - INFO - __main__ - Step 7715: {'lr': 0.0004981633165710914, 'samples': 1481280, 'steps': 7714, 'loss/train': 2.254359722137451} +11/06/2021 22:19:35 - INFO - __main__ - Step 7716: {'lr': 0.000498162674432165, 'samples': 1481472, 'steps': 7715, 'loss/train': 1.0957801342010498} +11/06/2021 22:19:36 - INFO - __main__ - Step 7717: {'lr': 0.0004981620321814203, 'samples': 1481664, 'steps': 7716, 'loss/train': 1.9144853353500366} +11/06/2021 22:19:36 - INFO - __main__ - Step 7718: {'lr': 0.0004981613898188576, 'samples': 1481856, 'steps': 7717, 'loss/train': 1.7931559085845947} +11/06/2021 22:19:37 - INFO - __main__ - Step 7719: {'lr': 0.0004981607473444772, 'samples': 1482048, 'steps': 7718, 'loss/train': 1.8735288381576538} +11/06/2021 22:19:37 - INFO - __main__ - Step 7720: {'lr': 0.0004981601047582794, 'samples': 1482240, 'steps': 7719, 'loss/train': 1.727927327156067} +11/06/2021 22:19:38 - INFO - __main__ - Step 7721: {'lr': 0.0004981594620602645, 'samples': 1482432, 'steps': 7720, 'loss/train': 1.948897361755371} +11/06/2021 22:19:38 - INFO - __main__ - Step 7722: {'lr': 0.0004981588192504329, 'samples': 1482624, 'steps': 7721, 'loss/train': 0.8639780879020691} +11/06/2021 22:19:38 - INFO - __main__ - Step 7723: {'lr': 0.0004981581763287845, 'samples': 1482816, 'steps': 7722, 'loss/train': 2.073319673538208} +11/06/2021 22:19:39 - INFO - __main__ - Step 7724: {'lr': 0.0004981575332953201, 'samples': 1483008, 'steps': 7723, 'loss/train': 1.5656884908676147} +11/06/2021 22:19:40 - INFO - __main__ - Step 7725: {'lr': 0.0004981568901500396, 'samples': 1483200, 'steps': 7724, 'loss/train': 1.949126124382019} +11/06/2021 22:19:40 - INFO - __main__ - Step 7726: {'lr': 0.0004981562468929435, 'samples': 1483392, 'steps': 7725, 'loss/train': 2.107515811920166} +11/06/2021 22:19:40 - INFO - __main__ - Step 7727: {'lr': 0.000498155603524032, 'samples': 1483584, 'steps': 7726, 'loss/train': 1.8496572971343994} +11/06/2021 22:19:41 - INFO - __main__ - Step 7728: {'lr': 0.0004981549600433054, 'samples': 1483776, 'steps': 7727, 'loss/train': 2.109135627746582} +11/06/2021 22:19:42 - INFO - __main__ - Step 7729: {'lr': 0.000498154316450764, 'samples': 1483968, 'steps': 7728, 'loss/train': 1.3323477506637573} +11/06/2021 22:19:43 - INFO - __main__ - Step 7730: {'lr': 0.0004981536727464082, 'samples': 1484160, 'steps': 7729, 'loss/train': 1.855273962020874} +11/06/2021 22:19:43 - INFO - __main__ - Step 7731: {'lr': 0.0004981530289302381, 'samples': 1484352, 'steps': 7730, 'loss/train': 0.4355550706386566} +11/06/2021 22:19:43 - INFO - __main__ - Step 7732: {'lr': 0.000498152385002254, 'samples': 1484544, 'steps': 7731, 'loss/train': 2.0949268341064453} +11/06/2021 22:19:44 - INFO - __main__ - Step 7733: {'lr': 0.0004981517409624564, 'samples': 1484736, 'steps': 7732, 'loss/train': 2.226652145385742} +11/06/2021 22:19:44 - INFO - __main__ - Step 7734: {'lr': 0.0004981510968108453, 'samples': 1484928, 'steps': 7733, 'loss/train': 2.1331582069396973} +11/06/2021 22:19:45 - INFO - __main__ - Step 7735: {'lr': 0.0004981504525474214, 'samples': 1485120, 'steps': 7734, 'loss/train': 1.9985811710357666} +11/06/2021 22:19:45 - INFO - __main__ - Step 7736: {'lr': 0.0004981498081721845, 'samples': 1485312, 'steps': 7735, 'loss/train': 2.0506227016448975} +11/06/2021 22:19:46 - INFO - __main__ - Step 7737: {'lr': 0.0004981491636851351, 'samples': 1485504, 'steps': 7736, 'loss/train': 1.7922340631484985} +11/06/2021 22:19:46 - INFO - __main__ - Step 7738: {'lr': 0.0004981485190862737, 'samples': 1485696, 'steps': 7737, 'loss/train': 1.6075444221496582} +11/06/2021 22:19:46 - INFO - __main__ - Step 7739: {'lr': 0.0004981478743756004, 'samples': 1485888, 'steps': 7738, 'loss/train': 1.6328068971633911} +11/06/2021 22:19:47 - INFO - __main__ - Step 7740: {'lr': 0.0004981472295531153, 'samples': 1486080, 'steps': 7739, 'loss/train': 2.0658867359161377} +11/06/2021 22:19:48 - INFO - __main__ - Step 7741: {'lr': 0.000498146584618819, 'samples': 1486272, 'steps': 7740, 'loss/train': 2.0356781482696533} +11/06/2021 22:19:48 - INFO - __main__ - Step 7742: {'lr': 0.0004981459395727117, 'samples': 1486464, 'steps': 7741, 'loss/train': 2.1248600482940674} +11/06/2021 22:19:49 - INFO - __main__ - Step 7743: {'lr': 0.0004981452944147937, 'samples': 1486656, 'steps': 7742, 'loss/train': 2.0457077026367188} +11/06/2021 22:19:49 - INFO - __main__ - Step 7744: {'lr': 0.0004981446491450652, 'samples': 1486848, 'steps': 7743, 'loss/train': 2.0596790313720703} +11/06/2021 22:19:50 - INFO - __main__ - Step 7745: {'lr': 0.0004981440037635266, 'samples': 1487040, 'steps': 7744, 'loss/train': 1.76706862449646} +11/06/2021 22:19:50 - INFO - __main__ - Step 7746: {'lr': 0.0004981433582701781, 'samples': 1487232, 'steps': 7745, 'loss/train': 1.9943227767944336} +11/06/2021 22:19:51 - INFO - __main__ - Step 7747: {'lr': 0.00049814271266502, 'samples': 1487424, 'steps': 7746, 'loss/train': 1.9205338954925537} +11/06/2021 22:19:51 - INFO - __main__ - Step 7748: {'lr': 0.0004981420669480526, 'samples': 1487616, 'steps': 7747, 'loss/train': 1.346489667892456} +11/06/2021 22:19:51 - INFO - __main__ - Step 7749: {'lr': 0.0004981414211192763, 'samples': 1487808, 'steps': 7748, 'loss/train': 2.3146755695343018} +11/06/2021 22:19:52 - INFO - __main__ - Step 7750: {'lr': 0.0004981407751786913, 'samples': 1488000, 'steps': 7749, 'loss/train': 1.654209852218628} +11/06/2021 22:19:53 - INFO - __main__ - Step 7751: {'lr': 0.0004981401291262979, 'samples': 1488192, 'steps': 7750, 'loss/train': 0.34622922539711} +11/06/2021 22:19:53 - INFO - __main__ - Step 7752: {'lr': 0.0004981394829620963, 'samples': 1488384, 'steps': 7751, 'loss/train': 1.7355235815048218} +11/06/2021 22:19:53 - INFO - __main__ - Step 7753: {'lr': 0.0004981388366860869, 'samples': 1488576, 'steps': 7752, 'loss/train': 1.484642744064331} +11/06/2021 22:19:54 - INFO - __main__ - Step 7754: {'lr': 0.0004981381902982702, 'samples': 1488768, 'steps': 7753, 'loss/train': 1.2855114936828613} +11/06/2021 22:19:54 - INFO - __main__ - Step 7755: {'lr': 0.0004981375437986459, 'samples': 1488960, 'steps': 7754, 'loss/train': 1.6895129680633545} +11/06/2021 22:19:55 - INFO - __main__ - Step 7756: {'lr': 0.0004981368971872149, 'samples': 1489152, 'steps': 7755, 'loss/train': 1.9353357553482056} +11/06/2021 22:19:55 - INFO - __main__ - Step 7757: {'lr': 0.0004981362504639772, 'samples': 1489344, 'steps': 7756, 'loss/train': 1.9244894981384277} +11/06/2021 22:19:56 - INFO - __main__ - Step 7758: {'lr': 0.0004981356036289331, 'samples': 1489536, 'steps': 7757, 'loss/train': 1.332854151725769} +11/06/2021 22:19:56 - INFO - __main__ - Step 7759: {'lr': 0.0004981349566820828, 'samples': 1489728, 'steps': 7758, 'loss/train': 1.9951647520065308} +11/06/2021 22:19:57 - INFO - __main__ - Step 7760: {'lr': 0.0004981343096234268, 'samples': 1489920, 'steps': 7759, 'loss/train': 1.7065505981445312} +11/06/2021 22:19:58 - INFO - __main__ - Step 7761: {'lr': 0.0004981336624529654, 'samples': 1490112, 'steps': 7760, 'loss/train': 1.5033037662506104} +11/06/2021 22:19:58 - INFO - __main__ - Step 7762: {'lr': 0.0004981330151706988, 'samples': 1490304, 'steps': 7761, 'loss/train': 1.2406482696533203} +11/06/2021 22:19:58 - INFO - __main__ - Step 7763: {'lr': 0.0004981323677766273, 'samples': 1490496, 'steps': 7762, 'loss/train': 2.313772678375244} +11/06/2021 22:19:59 - INFO - __main__ - Step 7764: {'lr': 0.000498131720270751, 'samples': 1490688, 'steps': 7763, 'loss/train': 1.9050623178482056} +11/06/2021 22:19:59 - INFO - __main__ - Step 7765: {'lr': 0.0004981310726530706, 'samples': 1490880, 'steps': 7764, 'loss/train': 1.5810691118240356} +11/06/2021 22:20:00 - INFO - __main__ - Step 7766: {'lr': 0.0004981304249235861, 'samples': 1491072, 'steps': 7765, 'loss/train': 1.6522554159164429} +11/06/2021 22:20:00 - INFO - __main__ - Step 7767: {'lr': 0.0004981297770822977, 'samples': 1491264, 'steps': 7766, 'loss/train': 2.1629531383514404} +11/06/2021 22:20:01 - INFO - __main__ - Step 7768: {'lr': 0.0004981291291292061, 'samples': 1491456, 'steps': 7767, 'loss/train': 2.0148024559020996} +11/06/2021 22:20:01 - INFO - __main__ - Step 7769: {'lr': 0.0004981284810643112, 'samples': 1491648, 'steps': 7768, 'loss/train': 1.8133976459503174} +11/06/2021 22:20:01 - INFO - __main__ - Step 7770: {'lr': 0.0004981278328876134, 'samples': 1491840, 'steps': 7769, 'loss/train': 1.844529151916504} +11/06/2021 22:20:02 - INFO - __main__ - Step 7771: {'lr': 0.0004981271845991131, 'samples': 1492032, 'steps': 7770, 'loss/train': 1.6602436304092407} +11/06/2021 22:20:03 - INFO - __main__ - Step 7772: {'lr': 0.0004981265361988105, 'samples': 1492224, 'steps': 7771, 'loss/train': 1.7457406520843506} +11/06/2021 22:20:03 - INFO - __main__ - Step 7773: {'lr': 0.000498125887686706, 'samples': 1492416, 'steps': 7772, 'loss/train': 1.8187391757965088} +11/06/2021 22:20:03 - INFO - __main__ - Step 7774: {'lr': 0.0004981252390627997, 'samples': 1492608, 'steps': 7773, 'loss/train': 2.382383108139038} +11/06/2021 22:20:04 - INFO - __main__ - Step 7775: {'lr': 0.000498124590327092, 'samples': 1492800, 'steps': 7774, 'loss/train': 2.054161310195923} +11/06/2021 22:20:05 - INFO - __main__ - Step 7776: {'lr': 0.0004981239414795832, 'samples': 1492992, 'steps': 7775, 'loss/train': 1.5990222692489624} +11/06/2021 22:20:05 - INFO - __main__ - Step 7777: {'lr': 0.0004981232925202736, 'samples': 1493184, 'steps': 7776, 'loss/train': 1.856432318687439} +11/06/2021 22:20:06 - INFO - __main__ - Step 7778: {'lr': 0.0004981226434491635, 'samples': 1493376, 'steps': 7777, 'loss/train': 1.7675282955169678} +11/06/2021 22:20:06 - INFO - __main__ - Step 7779: {'lr': 0.000498121994266253, 'samples': 1493568, 'steps': 7778, 'loss/train': 1.9787876605987549} +11/06/2021 22:20:07 - INFO - __main__ - Step 7780: {'lr': 0.0004981213449715427, 'samples': 1493760, 'steps': 7779, 'loss/train': 2.1368026733398438} +11/06/2021 22:20:07 - INFO - __main__ - Step 7781: {'lr': 0.0004981206955650328, 'samples': 1493952, 'steps': 7780, 'loss/train': 1.7741491794586182} +11/06/2021 22:20:08 - INFO - __main__ - Step 7782: {'lr': 0.0004981200460467234, 'samples': 1494144, 'steps': 7781, 'loss/train': 1.8448156118392944} +11/06/2021 22:20:08 - INFO - __main__ - Step 7783: {'lr': 0.0004981193964166151, 'samples': 1494336, 'steps': 7782, 'loss/train': 2.476020097732544} +11/06/2021 22:20:09 - INFO - __main__ - Step 7784: {'lr': 0.0004981187466747079, 'samples': 1494528, 'steps': 7783, 'loss/train': 1.604864478111267} +11/06/2021 22:20:09 - INFO - __main__ - Step 7785: {'lr': 0.0004981180968210023, 'samples': 1494720, 'steps': 7784, 'loss/train': 1.6935956478118896} +11/06/2021 22:20:09 - INFO - __main__ - Step 7786: {'lr': 0.0004981174468554984, 'samples': 1494912, 'steps': 7785, 'loss/train': 1.7149159908294678} +11/06/2021 22:20:10 - INFO - __main__ - Step 7787: {'lr': 0.0004981167967781968, 'samples': 1495104, 'steps': 7786, 'loss/train': 1.5972424745559692} +11/06/2021 22:20:11 - INFO - __main__ - Step 7788: {'lr': 0.0004981161465890975, 'samples': 1495296, 'steps': 7787, 'loss/train': 1.8924384117126465} +11/06/2021 22:20:11 - INFO - __main__ - Step 7789: {'lr': 0.0004981154962882008, 'samples': 1495488, 'steps': 7788, 'loss/train': 2.01082444190979} +11/06/2021 22:20:11 - INFO - __main__ - Step 7790: {'lr': 0.0004981148458755071, 'samples': 1495680, 'steps': 7789, 'loss/train': 2.0022146701812744} +11/06/2021 22:20:12 - INFO - __main__ - Step 7791: {'lr': 0.0004981141953510169, 'samples': 1495872, 'steps': 7790, 'loss/train': 1.9454317092895508} +11/06/2021 22:20:13 - INFO - __main__ - Step 7792: {'lr': 0.00049811354471473, 'samples': 1496064, 'steps': 7791, 'loss/train': 1.6417571306228638} +11/06/2021 22:20:13 - INFO - __main__ - Step 7793: {'lr': 0.0004981128939666471, 'samples': 1496256, 'steps': 7792, 'loss/train': 2.925060510635376} +11/06/2021 22:20:13 - INFO - __main__ - Step 7794: {'lr': 0.0004981122431067683, 'samples': 1496448, 'steps': 7793, 'loss/train': 2.0619399547576904} +11/06/2021 22:20:14 - INFO - __main__ - Step 7795: {'lr': 0.0004981115921350941, 'samples': 1496640, 'steps': 7794, 'loss/train': 1.3753095865249634} +11/06/2021 22:20:14 - INFO - __main__ - Step 7796: {'lr': 0.0004981109410516245, 'samples': 1496832, 'steps': 7795, 'loss/train': 1.4551738500595093} +11/06/2021 22:20:15 - INFO - __main__ - Step 7797: {'lr': 0.00049811028985636, 'samples': 1497024, 'steps': 7796, 'loss/train': 2.0298280715942383} +11/06/2021 22:20:15 - INFO - __main__ - Step 7798: {'lr': 0.0004981096385493007, 'samples': 1497216, 'steps': 7797, 'loss/train': 1.5669386386871338} +11/06/2021 22:20:16 - INFO - __main__ - Step 7799: {'lr': 0.0004981089871304472, 'samples': 1497408, 'steps': 7798, 'loss/train': 1.8886076211929321} +11/06/2021 22:20:16 - INFO - __main__ - Step 7800: {'lr': 0.0004981083355997995, 'samples': 1497600, 'steps': 7799, 'loss/train': 2.574296236038208} +11/06/2021 22:20:16 - INFO - __main__ - Step 7801: {'lr': 0.0004981076839573581, 'samples': 1497792, 'steps': 7800, 'loss/train': 0.9300814867019653} +11/06/2021 22:20:18 - INFO - __main__ - Step 7802: {'lr': 0.0004981070322031231, 'samples': 1497984, 'steps': 7801, 'loss/train': 1.7975281476974487} +11/06/2021 22:20:18 - INFO - __main__ - Step 7803: {'lr': 0.000498106380337095, 'samples': 1498176, 'steps': 7802, 'loss/train': 1.889115810394287} +11/06/2021 22:20:18 - INFO - __main__ - Step 7804: {'lr': 0.000498105728359274, 'samples': 1498368, 'steps': 7803, 'loss/train': 1.7939035892486572} +11/06/2021 22:20:19 - INFO - __main__ - Step 7805: {'lr': 0.0004981050762696604, 'samples': 1498560, 'steps': 7804, 'loss/train': 0.8266537189483643} +11/06/2021 22:20:19 - INFO - __main__ - Step 7806: {'lr': 0.0004981044240682544, 'samples': 1498752, 'steps': 7805, 'loss/train': 1.2602494955062866} +11/06/2021 22:20:19 - INFO - __main__ - Step 7807: {'lr': 0.0004981037717550564, 'samples': 1498944, 'steps': 7806, 'loss/train': 1.8031574487686157} +11/06/2021 22:20:20 - INFO - __main__ - Step 7808: {'lr': 0.0004981031193300667, 'samples': 1499136, 'steps': 7807, 'loss/train': 1.0529712438583374} +11/06/2021 22:20:21 - INFO - __main__ - Step 7809: {'lr': 0.0004981024667932855, 'samples': 1499328, 'steps': 7808, 'loss/train': 2.0406086444854736} +11/06/2021 22:20:21 - INFO - __main__ - Step 7810: {'lr': 0.0004981018141447133, 'samples': 1499520, 'steps': 7809, 'loss/train': 2.1355226039886475} +11/06/2021 22:20:21 - INFO - __main__ - Step 7811: {'lr': 0.00049810116138435, 'samples': 1499712, 'steps': 7810, 'loss/train': 1.709943413734436} +11/06/2021 22:20:22 - INFO - __main__ - Step 7812: {'lr': 0.0004981005085121963, 'samples': 1499904, 'steps': 7811, 'loss/train': 2.1915555000305176} +11/06/2021 22:20:23 - INFO - __main__ - Step 7813: {'lr': 0.0004980998555282524, 'samples': 1500096, 'steps': 7812, 'loss/train': 1.9955559968948364} +11/06/2021 22:20:23 - INFO - __main__ - Step 7814: {'lr': 0.0004980992024325185, 'samples': 1500288, 'steps': 7813, 'loss/train': 1.8444761037826538} +11/06/2021 22:20:24 - INFO - __main__ - Step 7815: {'lr': 0.0004980985492249949, 'samples': 1500480, 'steps': 7814, 'loss/train': 1.2955152988433838} +11/06/2021 22:20:24 - INFO - __main__ - Step 7816: {'lr': 0.0004980978959056819, 'samples': 1500672, 'steps': 7815, 'loss/train': 2.804755926132202} +11/06/2021 22:20:24 - INFO - __main__ - Step 7817: {'lr': 0.0004980972424745798, 'samples': 1500864, 'steps': 7816, 'loss/train': 2.022976875305176} +11/06/2021 22:20:26 - INFO - __main__ - Step 7818: {'lr': 0.000498096588931689, 'samples': 1501056, 'steps': 7817, 'loss/train': 1.9922711849212646} +11/06/2021 22:20:26 - INFO - __main__ - Step 7819: {'lr': 0.0004980959352770095, 'samples': 1501248, 'steps': 7818, 'loss/train': 2.2206287384033203} +11/06/2021 22:20:27 - INFO - __main__ - Step 7820: {'lr': 0.000498095281510542, 'samples': 1501440, 'steps': 7819, 'loss/train': 2.107832908630371} +11/06/2021 22:20:27 - INFO - __main__ - Step 7821: {'lr': 0.0004980946276322866, 'samples': 1501632, 'steps': 7820, 'loss/train': 2.020620822906494} +11/06/2021 22:20:27 - INFO - __main__ - Step 7822: {'lr': 0.0004980939736422436, 'samples': 1501824, 'steps': 7821, 'loss/train': 1.574951410293579} +11/06/2021 22:20:28 - INFO - __main__ - Step 7823: {'lr': 0.0004980933195404131, 'samples': 1502016, 'steps': 7822, 'loss/train': 1.5748287439346313} +11/06/2021 22:20:29 - INFO - __main__ - Step 7824: {'lr': 0.0004980926653267957, 'samples': 1502208, 'steps': 7823, 'loss/train': 2.000244617462158} +11/06/2021 22:20:29 - INFO - __main__ - Step 7825: {'lr': 0.0004980920110013915, 'samples': 1502400, 'steps': 7824, 'loss/train': 1.830479383468628} +11/06/2021 22:20:29 - INFO - __main__ - Step 7826: {'lr': 0.000498091356564201, 'samples': 1502592, 'steps': 7825, 'loss/train': 2.059532880783081} +11/06/2021 22:20:30 - INFO - __main__ - Step 7827: {'lr': 0.0004980907020152242, 'samples': 1502784, 'steps': 7826, 'loss/train': 2.0572545528411865} +11/06/2021 22:20:30 - INFO - __main__ - Step 7828: {'lr': 0.0004980900473544617, 'samples': 1502976, 'steps': 7827, 'loss/train': 1.7238388061523438} +11/06/2021 22:20:31 - INFO - __main__ - Step 7829: {'lr': 0.0004980893925819137, 'samples': 1503168, 'steps': 7828, 'loss/train': 1.9951441287994385} +11/06/2021 22:20:31 - INFO - __main__ - Step 7830: {'lr': 0.0004980887376975804, 'samples': 1503360, 'steps': 7829, 'loss/train': 1.7326819896697998} +11/06/2021 22:20:32 - INFO - __main__ - Step 7831: {'lr': 0.000498088082701462, 'samples': 1503552, 'steps': 7830, 'loss/train': 2.2184314727783203} +11/06/2021 22:20:32 - INFO - __main__ - Step 7832: {'lr': 0.0004980874275935591, 'samples': 1503744, 'steps': 7831, 'loss/train': 0.8481667041778564} +11/06/2021 22:20:32 - INFO - __main__ - Step 7833: {'lr': 0.0004980867723738717, 'samples': 1503936, 'steps': 7832, 'loss/train': 1.9760394096374512} +11/06/2021 22:20:34 - INFO - __main__ - Step 7834: {'lr': 0.0004980861170424003, 'samples': 1504128, 'steps': 7833, 'loss/train': 2.106902837753296} +11/06/2021 22:20:34 - INFO - __main__ - Step 7835: {'lr': 0.0004980854615991452, 'samples': 1504320, 'steps': 7834, 'loss/train': 2.3520045280456543} +11/06/2021 22:20:34 - INFO - __main__ - Step 7836: {'lr': 0.0004980848060441064, 'samples': 1504512, 'steps': 7835, 'loss/train': 2.106365442276001} +11/06/2021 22:20:35 - INFO - __main__ - Step 7837: {'lr': 0.0004980841503772846, 'samples': 1504704, 'steps': 7836, 'loss/train': 1.764209270477295} +11/06/2021 22:20:35 - INFO - __main__ - Step 7838: {'lr': 0.0004980834945986799, 'samples': 1504896, 'steps': 7837, 'loss/train': 2.0532870292663574} +11/06/2021 22:20:37 - INFO - __main__ - Step 7839: {'lr': 0.0004980828387082925, 'samples': 1505088, 'steps': 7838, 'loss/train': 2.207231283187866} +11/06/2021 22:20:37 - INFO - __main__ - Step 7840: {'lr': 0.000498082182706123, 'samples': 1505280, 'steps': 7839, 'loss/train': 0.6530503034591675} +11/06/2021 22:20:37 - INFO - __main__ - Step 7841: {'lr': 0.0004980815265921713, 'samples': 1505472, 'steps': 7840, 'loss/train': 0.6378718614578247} +11/06/2021 22:20:38 - INFO - __main__ - Step 7842: {'lr': 0.000498080870366438, 'samples': 1505664, 'steps': 7841, 'loss/train': 1.529860258102417} +11/06/2021 22:20:38 - INFO - __main__ - Step 7843: {'lr': 0.0004980802140289232, 'samples': 1505856, 'steps': 7842, 'loss/train': 1.2913402318954468} +11/06/2021 22:20:39 - INFO - __main__ - Step 7844: {'lr': 0.0004980795575796273, 'samples': 1506048, 'steps': 7843, 'loss/train': 1.243632435798645} +11/06/2021 22:20:39 - INFO - __main__ - Step 7845: {'lr': 0.0004980789010185507, 'samples': 1506240, 'steps': 7844, 'loss/train': 1.593994379043579} +11/06/2021 22:20:40 - INFO - __main__ - Step 7846: {'lr': 0.0004980782443456935, 'samples': 1506432, 'steps': 7845, 'loss/train': 1.4024707078933716} +11/06/2021 22:20:40 - INFO - __main__ - Step 7847: {'lr': 0.000498077587561056, 'samples': 1506624, 'steps': 7846, 'loss/train': 1.6562167406082153} +11/06/2021 22:20:40 - INFO - __main__ - Step 7848: {'lr': 0.0004980769306646386, 'samples': 1506816, 'steps': 7847, 'loss/train': 1.7106425762176514} +11/06/2021 22:20:41 - INFO - __main__ - Step 7849: {'lr': 0.0004980762736564417, 'samples': 1507008, 'steps': 7848, 'loss/train': 2.013291358947754} +11/06/2021 22:20:42 - INFO - __main__ - Step 7850: {'lr': 0.0004980756165364653, 'samples': 1507200, 'steps': 7849, 'loss/train': 2.613538980484009} +11/06/2021 22:20:42 - INFO - __main__ - Step 7851: {'lr': 0.0004980749593047099, 'samples': 1507392, 'steps': 7850, 'loss/train': 1.5560020208358765} +11/06/2021 22:20:43 - INFO - __main__ - Step 7852: {'lr': 0.0004980743019611757, 'samples': 1507584, 'steps': 7851, 'loss/train': 1.659212589263916} +11/06/2021 22:20:43 - INFO - __main__ - Step 7853: {'lr': 0.0004980736445058631, 'samples': 1507776, 'steps': 7852, 'loss/train': 1.3701859712600708} +11/06/2021 22:20:43 - INFO - __main__ - Step 7854: {'lr': 0.0004980729869387724, 'samples': 1507968, 'steps': 7853, 'loss/train': 1.2803887128829956} +11/06/2021 22:20:44 - INFO - __main__ - Step 7855: {'lr': 0.0004980723292599037, 'samples': 1508160, 'steps': 7854, 'loss/train': 1.8908063173294067} +11/06/2021 22:20:45 - INFO - __main__ - Step 7856: {'lr': 0.0004980716714692576, 'samples': 1508352, 'steps': 7855, 'loss/train': 1.353319764137268} +11/06/2021 22:20:45 - INFO - __main__ - Step 7857: {'lr': 0.0004980710135668342, 'samples': 1508544, 'steps': 7856, 'loss/train': 1.9040857553482056} +11/06/2021 22:20:45 - INFO - __main__ - Step 7858: {'lr': 0.0004980703555526338, 'samples': 1508736, 'steps': 7857, 'loss/train': 1.8307812213897705} +11/06/2021 22:20:46 - INFO - __main__ - Step 7859: {'lr': 0.0004980696974266566, 'samples': 1508928, 'steps': 7858, 'loss/train': 1.9307920932769775} +11/06/2021 22:20:47 - INFO - __main__ - Step 7860: {'lr': 0.0004980690391889033, 'samples': 1509120, 'steps': 7859, 'loss/train': 1.5426441431045532} +11/06/2021 22:20:47 - INFO - __main__ - Step 7861: {'lr': 0.0004980683808393737, 'samples': 1509312, 'steps': 7860, 'loss/train': 2.0717623233795166} +11/06/2021 22:20:48 - INFO - __main__ - Step 7862: {'lr': 0.0004980677223780683, 'samples': 1509504, 'steps': 7861, 'loss/train': 1.8097648620605469} +11/06/2021 22:20:48 - INFO - __main__ - Step 7863: {'lr': 0.0004980670638049875, 'samples': 1509696, 'steps': 7862, 'loss/train': 2.1986732482910156} +11/06/2021 22:20:48 - INFO - __main__ - Step 7864: {'lr': 0.0004980664051201315, 'samples': 1509888, 'steps': 7863, 'loss/train': 1.8978809118270874} +11/06/2021 22:20:49 - INFO - __main__ - Step 7865: {'lr': 0.0004980657463235006, 'samples': 1510080, 'steps': 7864, 'loss/train': 2.399979829788208} +11/06/2021 22:20:50 - INFO - __main__ - Step 7866: {'lr': 0.0004980650874150951, 'samples': 1510272, 'steps': 7865, 'loss/train': 2.042692184448242} +11/06/2021 22:20:50 - INFO - __main__ - Step 7867: {'lr': 0.0004980644283949152, 'samples': 1510464, 'steps': 7866, 'loss/train': 1.8365942239761353} +11/06/2021 22:20:50 - INFO - __main__ - Step 7868: {'lr': 0.0004980637692629615, 'samples': 1510656, 'steps': 7867, 'loss/train': 1.6458255052566528} +11/06/2021 22:20:51 - INFO - __main__ - Step 7869: {'lr': 0.0004980631100192339, 'samples': 1510848, 'steps': 7868, 'loss/train': 1.41680908203125} +11/06/2021 22:20:52 - INFO - __main__ - Step 7870: {'lr': 0.000498062450663733, 'samples': 1511040, 'steps': 7869, 'loss/train': 1.9412450790405273} +11/06/2021 22:20:53 - INFO - __main__ - Step 7871: {'lr': 0.000498061791196459, 'samples': 1511232, 'steps': 7870, 'loss/train': 1.4640387296676636} +11/06/2021 22:20:53 - INFO - __main__ - Step 7872: {'lr': 0.0004980611316174122, 'samples': 1511424, 'steps': 7871, 'loss/train': 1.4650890827178955} +11/06/2021 22:20:53 - INFO - __main__ - Step 7873: {'lr': 0.0004980604719265928, 'samples': 1511616, 'steps': 7872, 'loss/train': 1.9281331300735474} +11/06/2021 22:20:54 - INFO - __main__ - Step 7874: {'lr': 0.0004980598121240012, 'samples': 1511808, 'steps': 7873, 'loss/train': 1.7270317077636719} +11/06/2021 22:20:54 - INFO - __main__ - Step 7875: {'lr': 0.0004980591522096377, 'samples': 1512000, 'steps': 7874, 'loss/train': 3.885760545730591} +11/06/2021 22:20:55 - INFO - __main__ - Step 7876: {'lr': 0.0004980584921835025, 'samples': 1512192, 'steps': 7875, 'loss/train': 1.878515362739563} +11/06/2021 22:20:56 - INFO - __main__ - Step 7877: {'lr': 0.000498057832045596, 'samples': 1512384, 'steps': 7876, 'loss/train': 2.0955753326416016} +11/06/2021 22:20:56 - INFO - __main__ - Step 7878: {'lr': 0.0004980571717959186, 'samples': 1512576, 'steps': 7877, 'loss/train': 1.7663307189941406} +11/06/2021 22:20:56 - INFO - __main__ - Step 7879: {'lr': 0.0004980565114344704, 'samples': 1512768, 'steps': 7878, 'loss/train': 2.003199577331543} +11/06/2021 22:20:57 - INFO - __main__ - Step 7880: {'lr': 0.0004980558509612516, 'samples': 1512960, 'steps': 7879, 'loss/train': 1.4468077421188354} +11/06/2021 22:20:58 - INFO - __main__ - Step 7881: {'lr': 0.0004980551903762629, 'samples': 1513152, 'steps': 7880, 'loss/train': 1.9286073446273804} +11/06/2021 22:20:58 - INFO - __main__ - Step 7882: {'lr': 0.0004980545296795043, 'samples': 1513344, 'steps': 7881, 'loss/train': 1.9439208507537842} +11/06/2021 22:20:58 - INFO - __main__ - Step 7883: {'lr': 0.0004980538688709761, 'samples': 1513536, 'steps': 7882, 'loss/train': 1.9707108736038208} +11/06/2021 22:20:59 - INFO - __main__ - Step 7884: {'lr': 0.0004980532079506786, 'samples': 1513728, 'steps': 7883, 'loss/train': 2.4057676792144775} +11/06/2021 22:20:59 - INFO - __main__ - Step 7885: {'lr': 0.0004980525469186122, 'samples': 1513920, 'steps': 7884, 'loss/train': 2.0141124725341797} +11/06/2021 22:20:59 - INFO - __main__ - Step 7886: {'lr': 0.0004980518857747772, 'samples': 1514112, 'steps': 7885, 'loss/train': 1.6964260339736938} +11/06/2021 22:21:00 - INFO - __main__ - Step 7887: {'lr': 0.0004980512245191738, 'samples': 1514304, 'steps': 7886, 'loss/train': 2.2796289920806885} +11/06/2021 22:21:01 - INFO - __main__ - Step 7888: {'lr': 0.0004980505631518023, 'samples': 1514496, 'steps': 7887, 'loss/train': 1.9760662317276} +11/06/2021 22:21:01 - INFO - __main__ - Step 7889: {'lr': 0.0004980499016726632, 'samples': 1514688, 'steps': 7888, 'loss/train': 1.9461336135864258} +11/06/2021 22:21:01 - INFO - __main__ - Step 7890: {'lr': 0.0004980492400817564, 'samples': 1514880, 'steps': 7889, 'loss/train': 1.913292407989502} +11/06/2021 22:21:02 - INFO - __main__ - Step 7891: {'lr': 0.0004980485783790827, 'samples': 1515072, 'steps': 7890, 'loss/train': 1.8750466108322144} +11/06/2021 22:21:03 - INFO - __main__ - Step 7892: {'lr': 0.0004980479165646419, 'samples': 1515264, 'steps': 7891, 'loss/train': 2.3821234703063965} +11/06/2021 22:21:04 - INFO - __main__ - Step 7893: {'lr': 0.0004980472546384347, 'samples': 1515456, 'steps': 7892, 'loss/train': 2.1186270713806152} +11/06/2021 22:21:04 - INFO - __main__ - Step 7894: {'lr': 0.0004980465926004613, 'samples': 1515648, 'steps': 7893, 'loss/train': 5.3973493576049805} +11/06/2021 22:21:04 - INFO - __main__ - Step 7895: {'lr': 0.0004980459304507218, 'samples': 1515840, 'steps': 7894, 'loss/train': 2.0702314376831055} +11/06/2021 22:21:05 - INFO - __main__ - Step 7896: {'lr': 0.0004980452681892166, 'samples': 1516032, 'steps': 7895, 'loss/train': 2.7855825424194336} +11/06/2021 22:21:05 - INFO - __main__ - Step 7897: {'lr': 0.0004980446058159461, 'samples': 1516224, 'steps': 7896, 'loss/train': 2.5757217407226562} +11/06/2021 22:21:06 - INFO - __main__ - Step 7898: {'lr': 0.0004980439433309106, 'samples': 1516416, 'steps': 7897, 'loss/train': 1.7188911437988281} +11/06/2021 22:21:06 - INFO - __main__ - Step 7899: {'lr': 0.0004980432807341102, 'samples': 1516608, 'steps': 7898, 'loss/train': 1.881008267402649} +11/06/2021 22:21:07 - INFO - __main__ - Step 7900: {'lr': 0.0004980426180255453, 'samples': 1516800, 'steps': 7899, 'loss/train': 2.025660514831543} +11/06/2021 22:21:07 - INFO - __main__ - Step 7901: {'lr': 0.0004980419552052163, 'samples': 1516992, 'steps': 7900, 'loss/train': 1.8244693279266357} +11/06/2021 22:21:07 - INFO - __main__ - Step 7902: {'lr': 0.0004980412922731234, 'samples': 1517184, 'steps': 7901, 'loss/train': 2.084381103515625} +11/06/2021 22:21:09 - INFO - __main__ - Step 7903: {'lr': 0.0004980406292292669, 'samples': 1517376, 'steps': 7902, 'loss/train': 1.546284556388855} +11/06/2021 22:21:09 - INFO - __main__ - Step 7904: {'lr': 0.0004980399660736472, 'samples': 1517568, 'steps': 7903, 'loss/train': 1.5335673093795776} +11/06/2021 22:21:09 - INFO - __main__ - Step 7905: {'lr': 0.0004980393028062646, 'samples': 1517760, 'steps': 7904, 'loss/train': 2.310431480407715} +11/06/2021 22:21:10 - INFO - __main__ - Step 7906: {'lr': 0.0004980386394271191, 'samples': 1517952, 'steps': 7905, 'loss/train': 1.9592478275299072} +11/06/2021 22:21:10 - INFO - __main__ - Step 7907: {'lr': 0.0004980379759362113, 'samples': 1518144, 'steps': 7906, 'loss/train': 2.000092029571533} +11/06/2021 22:21:11 - INFO - __main__ - Step 7908: {'lr': 0.0004980373123335414, 'samples': 1518336, 'steps': 7907, 'loss/train': 2.0210494995117188} +11/06/2021 22:21:11 - INFO - __main__ - Step 7909: {'lr': 0.0004980366486191098, 'samples': 1518528, 'steps': 7908, 'loss/train': 1.597767949104309} +11/06/2021 22:21:12 - INFO - __main__ - Step 7910: {'lr': 0.0004980359847929167, 'samples': 1518720, 'steps': 7909, 'loss/train': 1.6900368928909302} +11/06/2021 22:21:12 - INFO - __main__ - Step 7911: {'lr': 0.0004980353208549623, 'samples': 1518912, 'steps': 7910, 'loss/train': 2.016561508178711} +11/06/2021 22:21:12 - INFO - __main__ - Step 7912: {'lr': 0.0004980346568052471, 'samples': 1519104, 'steps': 7911, 'loss/train': 1.868909478187561} +11/06/2021 22:21:14 - INFO - __main__ - Step 7913: {'lr': 0.0004980339926437713, 'samples': 1519296, 'steps': 7912, 'loss/train': 1.8896089792251587} +11/06/2021 22:21:14 - INFO - __main__ - Step 7914: {'lr': 0.0004980333283705351, 'samples': 1519488, 'steps': 7913, 'loss/train': 1.9207043647766113} +11/06/2021 22:21:14 - INFO - __main__ - Step 7915: {'lr': 0.000498032663985539, 'samples': 1519680, 'steps': 7914, 'loss/train': 1.3756333589553833} +11/06/2021 22:21:15 - INFO - __main__ - Step 7916: {'lr': 0.0004980319994887833, 'samples': 1519872, 'steps': 7915, 'loss/train': 1.878954291343689} +11/06/2021 22:21:15 - INFO - __main__ - Step 7917: {'lr': 0.0004980313348802681, 'samples': 1520064, 'steps': 7916, 'loss/train': 2.100268602371216} +11/06/2021 22:21:15 - INFO - __main__ - Step 7918: {'lr': 0.0004980306701599938, 'samples': 1520256, 'steps': 7917, 'loss/train': 2.110107421875} +11/06/2021 22:21:17 - INFO - __main__ - Step 7919: {'lr': 0.0004980300053279607, 'samples': 1520448, 'steps': 7918, 'loss/train': 2.0678465366363525} +11/06/2021 22:21:17 - INFO - __main__ - Step 7920: {'lr': 0.0004980293403841693, 'samples': 1520640, 'steps': 7919, 'loss/train': 2.0250751972198486} +11/06/2021 22:21:17 - INFO - __main__ - Step 7921: {'lr': 0.0004980286753286195, 'samples': 1520832, 'steps': 7920, 'loss/train': 0.41942548751831055} +11/06/2021 22:21:18 - INFO - __main__ - Step 7922: {'lr': 0.0004980280101613119, 'samples': 1521024, 'steps': 7921, 'loss/train': 2.067695379257202} +11/06/2021 22:21:18 - INFO - __main__ - Step 7923: {'lr': 0.0004980273448822466, 'samples': 1521216, 'steps': 7922, 'loss/train': 1.7907764911651611} +11/06/2021 22:21:19 - INFO - __main__ - Step 7924: {'lr': 0.000498026679491424, 'samples': 1521408, 'steps': 7923, 'loss/train': 1.5925756692886353} +11/06/2021 22:21:20 - INFO - __main__ - Step 7925: {'lr': 0.0004980260139888445, 'samples': 1521600, 'steps': 7924, 'loss/train': 1.906895637512207} +11/06/2021 22:21:20 - INFO - __main__ - Step 7926: {'lr': 0.0004980253483745083, 'samples': 1521792, 'steps': 7925, 'loss/train': 1.7573232650756836} +11/06/2021 22:21:20 - INFO - __main__ - Step 7927: {'lr': 0.0004980246826484157, 'samples': 1521984, 'steps': 7926, 'loss/train': 1.8057146072387695} +11/06/2021 22:21:21 - INFO - __main__ - Step 7928: {'lr': 0.000498024016810567, 'samples': 1522176, 'steps': 7927, 'loss/train': 0.6858081221580505} +11/06/2021 22:21:22 - INFO - __main__ - Step 7929: {'lr': 0.0004980233508609625, 'samples': 1522368, 'steps': 7928, 'loss/train': 1.501013994216919} +11/06/2021 22:21:22 - INFO - __main__ - Step 7930: {'lr': 0.0004980226847996025, 'samples': 1522560, 'steps': 7929, 'loss/train': 1.761657476425171} +11/06/2021 22:21:23 - INFO - __main__ - Step 7931: {'lr': 0.0004980220186264874, 'samples': 1522752, 'steps': 7930, 'loss/train': 1.874160885810852} +11/06/2021 22:21:23 - INFO - __main__ - Step 7932: {'lr': 0.0004980213523416172, 'samples': 1522944, 'steps': 7931, 'loss/train': 2.012180805206299} +11/06/2021 22:21:23 - INFO - __main__ - Step 7933: {'lr': 0.0004980206859449926, 'samples': 1523136, 'steps': 7932, 'loss/train': 2.158865213394165} +11/06/2021 22:21:24 - INFO - __main__ - Step 7934: {'lr': 0.0004980200194366136, 'samples': 1523328, 'steps': 7933, 'loss/train': 1.6870510578155518} +11/06/2021 22:21:25 - INFO - __main__ - Step 7935: {'lr': 0.0004980193528164806, 'samples': 1523520, 'steps': 7934, 'loss/train': 1.3986356258392334} +11/06/2021 22:21:25 - INFO - __main__ - Step 7936: {'lr': 0.0004980186860845939, 'samples': 1523712, 'steps': 7935, 'loss/train': 2.1106855869293213} +11/06/2021 22:21:25 - INFO - __main__ - Step 7937: {'lr': 0.0004980180192409539, 'samples': 1523904, 'steps': 7936, 'loss/train': 1.40969979763031} +11/06/2021 22:21:26 - INFO - __main__ - Step 7938: {'lr': 0.0004980173522855608, 'samples': 1524096, 'steps': 7937, 'loss/train': 1.793459415435791} +11/06/2021 22:21:26 - INFO - __main__ - Step 7939: {'lr': 0.0004980166852184148, 'samples': 1524288, 'steps': 7938, 'loss/train': 1.5917954444885254} +11/06/2021 22:21:27 - INFO - __main__ - Step 7940: {'lr': 0.0004980160180395164, 'samples': 1524480, 'steps': 7939, 'loss/train': 1.0192344188690186} +11/06/2021 22:21:27 - INFO - __main__ - Step 7941: {'lr': 0.0004980153507488657, 'samples': 1524672, 'steps': 7940, 'loss/train': 1.7049601078033447} +11/06/2021 22:21:28 - INFO - __main__ - Step 7942: {'lr': 0.0004980146833464633, 'samples': 1524864, 'steps': 7941, 'loss/train': 1.757932424545288} +11/06/2021 22:21:28 - INFO - __main__ - Step 7943: {'lr': 0.0004980140158323092, 'samples': 1525056, 'steps': 7942, 'loss/train': 1.4568382501602173} +11/06/2021 22:21:29 - INFO - __main__ - Step 7944: {'lr': 0.0004980133482064038, 'samples': 1525248, 'steps': 7943, 'loss/train': 2.041997194290161} +11/06/2021 22:21:30 - INFO - __main__ - Step 7945: {'lr': 0.0004980126804687474, 'samples': 1525440, 'steps': 7944, 'loss/train': 1.5531878471374512} +11/06/2021 22:21:30 - INFO - __main__ - Step 7946: {'lr': 0.0004980120126193403, 'samples': 1525632, 'steps': 7945, 'loss/train': 1.8834867477416992} +11/06/2021 22:21:30 - INFO - __main__ - Step 7947: {'lr': 0.0004980113446581829, 'samples': 1525824, 'steps': 7946, 'loss/train': 1.9784860610961914} +11/06/2021 22:21:31 - INFO - __main__ - Step 7948: {'lr': 0.0004980106765852753, 'samples': 1526016, 'steps': 7947, 'loss/train': 1.549972653388977} +11/06/2021 22:21:31 - INFO - __main__ - Step 7949: {'lr': 0.0004980100084006181, 'samples': 1526208, 'steps': 7948, 'loss/train': 1.9199172258377075} +11/06/2021 22:21:32 - INFO - __main__ - Step 7950: {'lr': 0.0004980093401042113, 'samples': 1526400, 'steps': 7949, 'loss/train': 1.6837117671966553} +11/06/2021 22:21:32 - INFO - __main__ - Step 7951: {'lr': 0.0004980086716960552, 'samples': 1526592, 'steps': 7950, 'loss/train': 2.027440071105957} +11/06/2021 22:21:33 - INFO - __main__ - Step 7952: {'lr': 0.0004980080031761504, 'samples': 1526784, 'steps': 7951, 'loss/train': 1.549945592880249} +11/06/2021 22:21:33 - INFO - __main__ - Step 7953: {'lr': 0.000498007334544497, 'samples': 1526976, 'steps': 7952, 'loss/train': 2.5235583782196045} +11/06/2021 22:21:33 - INFO - __main__ - Step 7954: {'lr': 0.0004980066658010952, 'samples': 1527168, 'steps': 7953, 'loss/train': 1.8120335340499878} +11/06/2021 22:21:34 - INFO - __main__ - Step 7955: {'lr': 0.0004980059969459455, 'samples': 1527360, 'steps': 7954, 'loss/train': 1.7081891298294067} +11/06/2021 22:21:35 - INFO - __main__ - Step 7956: {'lr': 0.0004980053279790481, 'samples': 1527552, 'steps': 7955, 'loss/train': 1.0960886478424072} +11/06/2021 22:21:35 - INFO - __main__ - Step 7957: {'lr': 0.0004980046589004034, 'samples': 1527744, 'steps': 7956, 'loss/train': 1.416310429573059} +11/06/2021 22:21:35 - INFO - __main__ - Step 7958: {'lr': 0.0004980039897100115, 'samples': 1527936, 'steps': 7957, 'loss/train': 2.159583568572998} +11/06/2021 22:21:36 - INFO - __main__ - Step 7959: {'lr': 0.000498003320407873, 'samples': 1528128, 'steps': 7958, 'loss/train': 2.172380208969116} +11/06/2021 22:21:36 - INFO - __main__ - Step 7960: {'lr': 0.000498002650993988, 'samples': 1528320, 'steps': 7959, 'loss/train': 1.913335919380188} +11/06/2021 22:21:37 - INFO - __main__ - Step 7961: {'lr': 0.0004980019814683568, 'samples': 1528512, 'steps': 7960, 'loss/train': 1.8780403137207031} +11/06/2021 22:21:38 - INFO - __main__ - Step 7962: {'lr': 0.0004980013118309796, 'samples': 1528704, 'steps': 7961, 'loss/train': 1.8526026010513306} +11/06/2021 22:21:38 - INFO - __main__ - Step 7963: {'lr': 0.000498000642081857, 'samples': 1528896, 'steps': 7962, 'loss/train': 1.8182376623153687} +11/06/2021 22:21:38 - INFO - __main__ - Step 7964: {'lr': 0.0004979999722209891, 'samples': 1529088, 'steps': 7963, 'loss/train': 1.9147931337356567} +11/06/2021 22:21:39 - INFO - __main__ - Step 7965: {'lr': 0.0004979993022483762, 'samples': 1529280, 'steps': 7964, 'loss/train': 1.8008043766021729} +11/06/2021 22:21:40 - INFO - __main__ - Step 7966: {'lr': 0.0004979986321640187, 'samples': 1529472, 'steps': 7965, 'loss/train': 1.427006483078003} +11/06/2021 22:21:40 - INFO - __main__ - Step 7967: {'lr': 0.0004979979619679168, 'samples': 1529664, 'steps': 7966, 'loss/train': 1.8842092752456665} +11/06/2021 22:21:41 - INFO - __main__ - Step 7968: {'lr': 0.0004979972916600708, 'samples': 1529856, 'steps': 7967, 'loss/train': 2.3407888412475586} +11/06/2021 22:21:41 - INFO - __main__ - Step 7969: {'lr': 0.0004979966212404812, 'samples': 1530048, 'steps': 7968, 'loss/train': 1.6167200803756714} +11/06/2021 22:21:41 - INFO - __main__ - Step 7970: {'lr': 0.0004979959507091479, 'samples': 1530240, 'steps': 7969, 'loss/train': 1.8462982177734375} +11/06/2021 22:21:42 - INFO - __main__ - Step 7971: {'lr': 0.0004979952800660717, 'samples': 1530432, 'steps': 7970, 'loss/train': 2.2095303535461426} +11/06/2021 22:21:43 - INFO - __main__ - Step 7972: {'lr': 0.0004979946093112525, 'samples': 1530624, 'steps': 7971, 'loss/train': 2.2119836807250977} +11/06/2021 22:21:44 - INFO - __main__ - Step 7973: {'lr': 0.0004979939384446908, 'samples': 1530816, 'steps': 7972, 'loss/train': 1.7757575511932373} +11/06/2021 22:21:44 - INFO - __main__ - Step 7974: {'lr': 0.0004979932674663869, 'samples': 1531008, 'steps': 7973, 'loss/train': 1.04556405544281} +11/06/2021 22:21:44 - INFO - __main__ - Step 7975: {'lr': 0.000497992596376341, 'samples': 1531200, 'steps': 7974, 'loss/train': 1.6081430912017822} +11/06/2021 22:21:45 - INFO - __main__ - Step 7976: {'lr': 0.0004979919251745535, 'samples': 1531392, 'steps': 7975, 'loss/train': 2.162876844406128} +11/06/2021 22:21:46 - INFO - __main__ - Step 7977: {'lr': 0.0004979912538610247, 'samples': 1531584, 'steps': 7976, 'loss/train': 1.4090156555175781} +11/06/2021 22:21:46 - INFO - __main__ - Step 7978: {'lr': 0.0004979905824357548, 'samples': 1531776, 'steps': 7977, 'loss/train': 1.850123405456543} +11/06/2021 22:21:46 - INFO - __main__ - Step 7979: {'lr': 0.0004979899108987442, 'samples': 1531968, 'steps': 7978, 'loss/train': 2.130842685699463} +11/06/2021 22:21:47 - INFO - __main__ - Step 7980: {'lr': 0.0004979892392499932, 'samples': 1532160, 'steps': 7979, 'loss/train': 1.864031434059143} +11/06/2021 22:21:47 - INFO - __main__ - Step 7981: {'lr': 0.0004979885674895021, 'samples': 1532352, 'steps': 7980, 'loss/train': 1.6603336334228516} +11/06/2021 22:21:48 - INFO - __main__ - Step 7982: {'lr': 0.0004979878956172711, 'samples': 1532544, 'steps': 7981, 'loss/train': 1.4955323934555054} +11/06/2021 22:21:48 - INFO - __main__ - Step 7983: {'lr': 0.0004979872236333005, 'samples': 1532736, 'steps': 7982, 'loss/train': 2.017420530319214} +11/06/2021 22:21:49 - INFO - __main__ - Step 7984: {'lr': 0.0004979865515375908, 'samples': 1532928, 'steps': 7983, 'loss/train': 1.8274989128112793} +11/06/2021 22:21:49 - INFO - __main__ - Step 7985: {'lr': 0.0004979858793301422, 'samples': 1533120, 'steps': 7984, 'loss/train': 1.6632914543151855} +11/06/2021 22:21:49 - INFO - __main__ - Step 7986: {'lr': 0.000497985207010955, 'samples': 1533312, 'steps': 7985, 'loss/train': 1.2843949794769287} +11/06/2021 22:21:50 - INFO - __main__ - Step 7987: {'lr': 0.0004979845345800294, 'samples': 1533504, 'steps': 7986, 'loss/train': 1.5527995824813843} +11/06/2021 22:21:51 - INFO - __main__ - Step 7988: {'lr': 0.0004979838620373659, 'samples': 1533696, 'steps': 7987, 'loss/train': 1.7927266359329224} +11/06/2021 22:21:52 - INFO - __main__ - Step 7989: {'lr': 0.0004979831893829646, 'samples': 1533888, 'steps': 7988, 'loss/train': 0.755244791507721} +11/06/2021 22:21:52 - INFO - __main__ - Step 7990: {'lr': 0.0004979825166168259, 'samples': 1534080, 'steps': 7989, 'loss/train': 1.9054588079452515} +11/06/2021 22:21:52 - INFO - __main__ - Step 7991: {'lr': 0.0004979818437389502, 'samples': 1534272, 'steps': 7990, 'loss/train': 1.586555004119873} +11/06/2021 22:21:53 - INFO - __main__ - Step 7992: {'lr': 0.0004979811707493377, 'samples': 1534464, 'steps': 7991, 'loss/train': 2.3696506023406982} +11/06/2021 22:21:53 - INFO - __main__ - Step 7993: {'lr': 0.0004979804976479887, 'samples': 1534656, 'steps': 7992, 'loss/train': 2.9696648120880127} +11/06/2021 22:21:54 - INFO - __main__ - Step 7994: {'lr': 0.0004979798244349034, 'samples': 1534848, 'steps': 7993, 'loss/train': 0.5555250644683838} +11/06/2021 22:21:54 - INFO - __main__ - Step 7995: {'lr': 0.0004979791511100823, 'samples': 1535040, 'steps': 7994, 'loss/train': 2.1885805130004883} +11/06/2021 22:21:55 - INFO - __main__ - Step 7996: {'lr': 0.0004979784776735257, 'samples': 1535232, 'steps': 7995, 'loss/train': 2.107032060623169} +11/06/2021 22:21:55 - INFO - __main__ - Step 7997: {'lr': 0.0004979778041252338, 'samples': 1535424, 'steps': 7996, 'loss/train': 1.827415943145752} +11/06/2021 22:21:55 - INFO - __main__ - Step 7998: {'lr': 0.0004979771304652068, 'samples': 1535616, 'steps': 7997, 'loss/train': 1.842453122138977} +11/06/2021 22:21:56 - INFO - __main__ - Step 7999: {'lr': 0.0004979764566934452, 'samples': 1535808, 'steps': 7998, 'loss/train': 1.6808557510375977} +11/06/2021 22:21:57 - INFO - __main__ - Step 8000: {'lr': 0.0004979757828099492, 'samples': 1536000, 'steps': 7999, 'loss/train': 1.729453206062317} +11/06/2021 22:21:57 - INFO - __main__ - Step 8001: {'lr': 0.0004979751088147192, 'samples': 1536192, 'steps': 8000, 'loss/train': 1.9405218362808228} +11/06/2021 22:21:58 - INFO - __main__ - Step 8002: {'lr': 0.0004979744347077555, 'samples': 1536384, 'steps': 8001, 'loss/train': 1.666454553604126} +11/06/2021 22:21:58 - INFO - __main__ - Step 8003: {'lr': 0.0004979737604890582, 'samples': 1536576, 'steps': 8002, 'loss/train': 2.0916402339935303} +11/06/2021 22:22:00 - INFO - __main__ - Step 8004: {'lr': 0.0004979730861586278, 'samples': 1536768, 'steps': 8003, 'loss/train': 2.936959743499756} +11/06/2021 22:22:00 - INFO - __main__ - Step 8005: {'lr': 0.0004979724117164646, 'samples': 1536960, 'steps': 8004, 'loss/train': 2.1846797466278076} +11/06/2021 22:22:00 - INFO - __main__ - Step 8006: {'lr': 0.0004979717371625689, 'samples': 1537152, 'steps': 8005, 'loss/train': 1.4431344270706177} +11/06/2021 22:22:01 - INFO - __main__ - Step 8007: {'lr': 0.0004979710624969408, 'samples': 1537344, 'steps': 8006, 'loss/train': 1.6920371055603027} +11/06/2021 22:22:01 - INFO - __main__ - Step 8008: {'lr': 0.000497970387719581, 'samples': 1537536, 'steps': 8007, 'loss/train': 1.7911888360977173} +11/06/2021 22:22:01 - INFO - __main__ - Step 8009: {'lr': 0.0004979697128304893, 'samples': 1537728, 'steps': 8008, 'loss/train': 2.065598249435425} +11/06/2021 22:22:02 - INFO - __main__ - Step 8010: {'lr': 0.0004979690378296665, 'samples': 1537920, 'steps': 8009, 'loss/train': 1.9170726537704468} +11/06/2021 22:22:02 - INFO - __main__ - Step 8011: {'lr': 0.0004979683627171125, 'samples': 1538112, 'steps': 8010, 'loss/train': 2.038038730621338} +11/06/2021 22:22:03 - INFO - __main__ - Step 8012: {'lr': 0.0004979676874928278, 'samples': 1538304, 'steps': 8011, 'loss/train': 1.8985741138458252} +11/06/2021 22:22:04 - INFO - __main__ - Step 8013: {'lr': 0.0004979670121568129, 'samples': 1538496, 'steps': 8012, 'loss/train': 2.169818878173828} +11/06/2021 22:22:04 - INFO - __main__ - Step 8014: {'lr': 0.0004979663367090676, 'samples': 1538688, 'steps': 8013, 'loss/train': 2.037712335586548} +11/06/2021 22:22:04 - INFO - __main__ - Step 8015: {'lr': 0.0004979656611495927, 'samples': 1538880, 'steps': 8014, 'loss/train': 2.2237470149993896} +11/06/2021 22:22:05 - INFO - __main__ - Step 8016: {'lr': 0.0004979649854783883, 'samples': 1539072, 'steps': 8015, 'loss/train': 1.822688341140747} +11/06/2021 22:22:06 - INFO - __main__ - Step 8017: {'lr': 0.0004979643096954545, 'samples': 1539264, 'steps': 8016, 'loss/train': 2.502737283706665} +11/06/2021 22:22:06 - INFO - __main__ - Step 8018: {'lr': 0.000497963633800792, 'samples': 1539456, 'steps': 8017, 'loss/train': 1.937386393547058} +11/06/2021 22:22:06 - INFO - __main__ - Step 8019: {'lr': 0.0004979629577944009, 'samples': 1539648, 'steps': 8018, 'loss/train': 1.8304017782211304} +11/06/2021 22:22:07 - INFO - __main__ - Step 8020: {'lr': 0.0004979622816762815, 'samples': 1539840, 'steps': 8019, 'loss/train': 2.0212595462799072} +11/06/2021 22:22:07 - INFO - __main__ - Step 8021: {'lr': 0.0004979616054464341, 'samples': 1540032, 'steps': 8020, 'loss/train': 1.852665662765503} +11/06/2021 22:22:08 - INFO - __main__ - Step 8022: {'lr': 0.000497960929104859, 'samples': 1540224, 'steps': 8021, 'loss/train': 2.02396821975708} +11/06/2021 22:22:08 - INFO - __main__ - Step 8023: {'lr': 0.0004979602526515566, 'samples': 1540416, 'steps': 8022, 'loss/train': 2.089334726333618} +11/06/2021 22:22:09 - INFO - __main__ - Step 8024: {'lr': 0.0004979595760865271, 'samples': 1540608, 'steps': 8023, 'loss/train': 1.602588176727295} +11/06/2021 22:22:09 - INFO - __main__ - Step 8025: {'lr': 0.0004979588994097708, 'samples': 1540800, 'steps': 8024, 'loss/train': 1.3973878622055054} +11/06/2021 22:22:09 - INFO - __main__ - Step 8026: {'lr': 0.0004979582226212881, 'samples': 1540992, 'steps': 8025, 'loss/train': 1.1899759769439697} +11/06/2021 22:22:10 - INFO - __main__ - Step 8027: {'lr': 0.0004979575457210792, 'samples': 1541184, 'steps': 8026, 'loss/train': 1.6932975053787231} +11/06/2021 22:22:11 - INFO - __main__ - Step 8028: {'lr': 0.0004979568687091446, 'samples': 1541376, 'steps': 8027, 'loss/train': 1.7348906993865967} +11/06/2021 22:22:11 - INFO - __main__ - Step 8029: {'lr': 0.0004979561915854843, 'samples': 1541568, 'steps': 8028, 'loss/train': 1.5938066244125366} +11/06/2021 22:22:12 - INFO - __main__ - Step 8030: {'lr': 0.0004979555143500988, 'samples': 1541760, 'steps': 8029, 'loss/train': 2.0716259479522705} +11/06/2021 22:22:12 - INFO - __main__ - Step 8031: {'lr': 0.0004979548370029884, 'samples': 1541952, 'steps': 8030, 'loss/train': 1.7080976963043213} +11/06/2021 22:22:12 - INFO - __main__ - Step 8032: {'lr': 0.0004979541595441534, 'samples': 1542144, 'steps': 8031, 'loss/train': 1.9131830930709839} +11/06/2021 22:22:13 - INFO - __main__ - Step 8033: {'lr': 0.000497953481973594, 'samples': 1542336, 'steps': 8032, 'loss/train': 1.6197700500488281} +11/06/2021 22:22:14 - INFO - __main__ - Step 8034: {'lr': 0.0004979528042913106, 'samples': 1542528, 'steps': 8033, 'loss/train': 1.7297489643096924} +11/06/2021 22:22:14 - INFO - __main__ - Step 8035: {'lr': 0.0004979521264973036, 'samples': 1542720, 'steps': 8034, 'loss/train': 2.004364490509033} +11/06/2021 22:22:14 - INFO - __main__ - Step 8036: {'lr': 0.0004979514485915731, 'samples': 1542912, 'steps': 8035, 'loss/train': 1.4310439825057983} +11/06/2021 22:22:15 - INFO - __main__ - Step 8037: {'lr': 0.0004979507705741195, 'samples': 1543104, 'steps': 8036, 'loss/train': 1.9910510778427124} +11/06/2021 22:22:16 - INFO - __main__ - Step 8038: {'lr': 0.0004979500924449431, 'samples': 1543296, 'steps': 8037, 'loss/train': 1.46047043800354} +11/06/2021 22:22:16 - INFO - __main__ - Step 8039: {'lr': 0.0004979494142040444, 'samples': 1543488, 'steps': 8038, 'loss/train': 1.9380624294281006} +11/06/2021 22:22:16 - INFO - __main__ - Step 8040: {'lr': 0.0004979487358514233, 'samples': 1543680, 'steps': 8039, 'loss/train': 1.9118831157684326} +11/06/2021 22:22:17 - INFO - __main__ - Step 8041: {'lr': 0.0004979480573870803, 'samples': 1543872, 'steps': 8040, 'loss/train': 1.2592707872390747} +11/06/2021 22:22:17 - INFO - __main__ - Step 8042: {'lr': 0.000497947378811016, 'samples': 1544064, 'steps': 8041, 'loss/train': 2.1490068435668945} +11/06/2021 22:22:18 - INFO - __main__ - Step 8043: {'lr': 0.0004979467001232302, 'samples': 1544256, 'steps': 8042, 'loss/train': 1.6307603120803833} +11/06/2021 22:22:18 - INFO - __main__ - Step 8044: {'lr': 0.0004979460213237235, 'samples': 1544448, 'steps': 8043, 'loss/train': 1.8183969259262085} +11/06/2021 22:22:19 - INFO - __main__ - Step 8045: {'lr': 0.0004979453424124961, 'samples': 1544640, 'steps': 8044, 'loss/train': 1.2424389123916626} +11/06/2021 22:22:19 - INFO - __main__ - Step 8046: {'lr': 0.0004979446633895484, 'samples': 1544832, 'steps': 8045, 'loss/train': 1.352750301361084} +11/06/2021 22:22:20 - INFO - __main__ - Step 8047: {'lr': 0.0004979439842548808, 'samples': 1545024, 'steps': 8046, 'loss/train': 1.8693174123764038} +11/06/2021 22:22:20 - INFO - __main__ - Step 8048: {'lr': 0.0004979433050084933, 'samples': 1545216, 'steps': 8047, 'loss/train': 1.2310196161270142} +11/06/2021 22:22:21 - INFO - __main__ - Step 8049: {'lr': 0.0004979426256503863, 'samples': 1545408, 'steps': 8048, 'loss/train': 2.2753522396087646} +11/06/2021 22:22:21 - INFO - __main__ - Step 8050: {'lr': 0.0004979419461805603, 'samples': 1545600, 'steps': 8049, 'loss/train': 2.1069955825805664} +11/06/2021 22:22:22 - INFO - __main__ - Step 8051: {'lr': 0.0004979412665990156, 'samples': 1545792, 'steps': 8050, 'loss/train': 1.705078125} +11/06/2021 22:22:22 - INFO - __main__ - Step 8052: {'lr': 0.0004979405869057522, 'samples': 1545984, 'steps': 8051, 'loss/train': 1.9316350221633911} +11/06/2021 22:22:23 - INFO - __main__ - Step 8053: {'lr': 0.0004979399071007707, 'samples': 1546176, 'steps': 8052, 'loss/train': 2.099993944168091} +11/06/2021 22:22:23 - INFO - __main__ - Step 8054: {'lr': 0.0004979392271840712, 'samples': 1546368, 'steps': 8053, 'loss/train': 1.937470555305481} +11/06/2021 22:22:24 - INFO - __main__ - Step 8055: {'lr': 0.0004979385471556542, 'samples': 1546560, 'steps': 8054, 'loss/train': 2.03237247467041} +11/06/2021 22:22:24 - INFO - __main__ - Step 8056: {'lr': 0.00049793786701552, 'samples': 1546752, 'steps': 8055, 'loss/train': 1.7011387348175049} +11/06/2021 22:22:24 - INFO - __main__ - Step 8057: {'lr': 0.0004979371867636687, 'samples': 1546944, 'steps': 8056, 'loss/train': 1.647082805633545} +11/06/2021 22:22:25 - INFO - __main__ - Step 8058: {'lr': 0.0004979365064001007, 'samples': 1547136, 'steps': 8057, 'loss/train': 1.8520019054412842} +11/06/2021 22:22:26 - INFO - __main__ - Step 8059: {'lr': 0.0004979358259248164, 'samples': 1547328, 'steps': 8058, 'loss/train': 1.324270486831665} +11/06/2021 22:22:26 - INFO - __main__ - Step 8060: {'lr': 0.000497935145337816, 'samples': 1547520, 'steps': 8059, 'loss/train': 1.6463035345077515} +11/06/2021 22:22:27 - INFO - __main__ - Step 8061: {'lr': 0.0004979344646390999, 'samples': 1547712, 'steps': 8060, 'loss/train': 2.0036861896514893} +11/06/2021 22:22:27 - INFO - __main__ - Step 8062: {'lr': 0.0004979337838286684, 'samples': 1547904, 'steps': 8061, 'loss/train': 1.1817820072174072} +11/06/2021 22:22:27 - INFO - __main__ - Step 8063: {'lr': 0.0004979331029065216, 'samples': 1548096, 'steps': 8062, 'loss/train': 1.7082180976867676} +11/06/2021 22:22:28 - INFO - __main__ - Step 8064: {'lr': 0.00049793242187266, 'samples': 1548288, 'steps': 8063, 'loss/train': 1.778818964958191} +11/06/2021 22:22:29 - INFO - __main__ - Step 8065: {'lr': 0.000497931740727084, 'samples': 1548480, 'steps': 8064, 'loss/train': 6.108870983123779} +11/06/2021 22:22:29 - INFO - __main__ - Step 8066: {'lr': 0.0004979310594697937, 'samples': 1548672, 'steps': 8065, 'loss/train': 2.9927406311035156} +11/06/2021 22:22:30 - INFO - __main__ - Step 8067: {'lr': 0.0004979303781007896, 'samples': 1548864, 'steps': 8066, 'loss/train': 1.902443528175354} +11/06/2021 22:22:30 - INFO - __main__ - Step 8068: {'lr': 0.0004979296966200718, 'samples': 1549056, 'steps': 8067, 'loss/train': 1.7086400985717773} +11/06/2021 22:22:30 - INFO - __main__ - Step 8069: {'lr': 0.0004979290150276407, 'samples': 1549248, 'steps': 8068, 'loss/train': 1.9971203804016113} +11/06/2021 22:22:31 - INFO - __main__ - Step 8070: {'lr': 0.0004979283333234966, 'samples': 1549440, 'steps': 8069, 'loss/train': 1.9657219648361206} +11/06/2021 22:22:32 - INFO - __main__ - Step 8071: {'lr': 0.0004979276515076399, 'samples': 1549632, 'steps': 8070, 'loss/train': 1.041121482849121} +11/06/2021 22:22:32 - INFO - __main__ - Step 8072: {'lr': 0.0004979269695800707, 'samples': 1549824, 'steps': 8071, 'loss/train': 2.119021415710449} +11/06/2021 22:22:32 - INFO - __main__ - Step 8073: {'lr': 0.0004979262875407896, 'samples': 1550016, 'steps': 8072, 'loss/train': 1.3283685445785522} +11/06/2021 22:22:33 - INFO - __main__ - Step 8074: {'lr': 0.0004979256053897966, 'samples': 1550208, 'steps': 8073, 'loss/train': 2.044589042663574} +11/06/2021 22:22:35 - INFO - __main__ - Step 8075: {'lr': 0.0004979249231270923, 'samples': 1550400, 'steps': 8074, 'loss/train': 1.9413076639175415} +11/06/2021 22:22:35 - INFO - __main__ - Step 8076: {'lr': 0.0004979242407526766, 'samples': 1550592, 'steps': 8075, 'loss/train': 1.5758004188537598} +11/06/2021 22:22:35 - INFO - __main__ - Step 8077: {'lr': 0.0004979235582665503, 'samples': 1550784, 'steps': 8076, 'loss/train': 2.4612207412719727} +11/06/2021 22:22:36 - INFO - __main__ - Step 8078: {'lr': 0.0004979228756687135, 'samples': 1550976, 'steps': 8077, 'loss/train': 2.0157461166381836} +11/06/2021 22:22:36 - INFO - __main__ - Step 8079: {'lr': 0.0004979221929591663, 'samples': 1551168, 'steps': 8078, 'loss/train': 2.025535821914673} +11/06/2021 22:22:36 - INFO - __main__ - Step 8080: {'lr': 0.0004979215101379093, 'samples': 1551360, 'steps': 8079, 'loss/train': 1.8989232778549194} +11/06/2021 22:22:37 - INFO - __main__ - Step 8081: {'lr': 0.0004979208272049426, 'samples': 1551552, 'steps': 8080, 'loss/train': 1.8116631507873535} +11/06/2021 22:22:37 - INFO - __main__ - Step 8082: {'lr': 0.0004979201441602665, 'samples': 1551744, 'steps': 8081, 'loss/train': 1.6327272653579712} +11/06/2021 22:22:38 - INFO - __main__ - Step 8083: {'lr': 0.0004979194610038816, 'samples': 1551936, 'steps': 8082, 'loss/train': 2.1452510356903076} +11/06/2021 22:22:39 - INFO - __main__ - Step 8084: {'lr': 0.000497918777735788, 'samples': 1552128, 'steps': 8083, 'loss/train': 1.8749728202819824} +11/06/2021 22:22:39 - INFO - __main__ - Step 8085: {'lr': 0.000497918094355986, 'samples': 1552320, 'steps': 8084, 'loss/train': 1.904146671295166} +11/06/2021 22:22:39 - INFO - __main__ - Step 8086: {'lr': 0.000497917410864476, 'samples': 1552512, 'steps': 8085, 'loss/train': 1.7037712335586548} +11/06/2021 22:22:40 - INFO - __main__ - Step 8087: {'lr': 0.0004979167272612581, 'samples': 1552704, 'steps': 8086, 'loss/train': 1.7576018571853638} +11/06/2021 22:22:41 - INFO - __main__ - Step 8088: {'lr': 0.0004979160435463328, 'samples': 1552896, 'steps': 8087, 'loss/train': 1.7359386682510376} +11/06/2021 22:22:41 - INFO - __main__ - Step 8089: {'lr': 0.0004979153597197003, 'samples': 1553088, 'steps': 8088, 'loss/train': 1.035143256187439} +11/06/2021 22:22:41 - INFO - __main__ - Step 8090: {'lr': 0.0004979146757813611, 'samples': 1553280, 'steps': 8089, 'loss/train': 1.9019252061843872} +11/06/2021 22:22:42 - INFO - __main__ - Step 8091: {'lr': 0.0004979139917313153, 'samples': 1553472, 'steps': 8090, 'loss/train': 1.6100707054138184} +11/06/2021 22:22:42 - INFO - __main__ - Step 8092: {'lr': 0.0004979133075695634, 'samples': 1553664, 'steps': 8091, 'loss/train': 1.4543089866638184} +11/06/2021 22:22:43 - INFO - __main__ - Step 8093: {'lr': 0.0004979126232961054, 'samples': 1553856, 'steps': 8092, 'loss/train': 1.6169660091400146} +11/06/2021 22:22:43 - INFO - __main__ - Step 8094: {'lr': 0.0004979119389109419, 'samples': 1554048, 'steps': 8093, 'loss/train': 1.693862795829773} +11/06/2021 22:22:44 - INFO - __main__ - Step 8095: {'lr': 0.000497911254414073, 'samples': 1554240, 'steps': 8094, 'loss/train': 1.6328054666519165} +11/06/2021 22:22:44 - INFO - __main__ - Step 8096: {'lr': 0.0004979105698054992, 'samples': 1554432, 'steps': 8095, 'loss/train': 2.0879011154174805} +11/06/2021 22:22:44 - INFO - __main__ - Step 8097: {'lr': 0.0004979098850852208, 'samples': 1554624, 'steps': 8096, 'loss/train': 1.8429865837097168} +11/06/2021 22:22:46 - INFO - __main__ - Step 8098: {'lr': 0.0004979092002532379, 'samples': 1554816, 'steps': 8097, 'loss/train': 2.1915647983551025} +11/06/2021 22:22:46 - INFO - __main__ - Step 8099: {'lr': 0.0004979085153095509, 'samples': 1555008, 'steps': 8098, 'loss/train': 2.256697177886963} +11/06/2021 22:22:46 - INFO - __main__ - Step 8100: {'lr': 0.0004979078302541604, 'samples': 1555200, 'steps': 8099, 'loss/train': 1.6514664888381958} +11/06/2021 22:22:47 - INFO - __main__ - Step 8101: {'lr': 0.0004979071450870662, 'samples': 1555392, 'steps': 8100, 'loss/train': 1.7830842733383179} +11/06/2021 22:22:47 - INFO - __main__ - Step 8102: {'lr': 0.0004979064598082689, 'samples': 1555584, 'steps': 8101, 'loss/train': 2.325873851776123} +11/06/2021 22:22:48 - INFO - __main__ - Step 8103: {'lr': 0.0004979057744177689, 'samples': 1555776, 'steps': 8102, 'loss/train': 1.6292482614517212} +11/06/2021 22:22:48 - INFO - __main__ - Step 8104: {'lr': 0.0004979050889155663, 'samples': 1555968, 'steps': 8103, 'loss/train': 1.9589861631393433} +11/06/2021 22:22:49 - INFO - __main__ - Step 8105: {'lr': 0.0004979044033016616, 'samples': 1556160, 'steps': 8104, 'loss/train': 1.5695750713348389} +11/06/2021 22:22:49 - INFO - __main__ - Step 8106: {'lr': 0.0004979037175760548, 'samples': 1556352, 'steps': 8105, 'loss/train': 2.045214891433716} +11/06/2021 22:22:49 - INFO - __main__ - Step 8107: {'lr': 0.0004979030317387466, 'samples': 1556544, 'steps': 8106, 'loss/train': 2.292895555496216} +11/06/2021 22:22:50 - INFO - __main__ - Step 8108: {'lr': 0.0004979023457897371, 'samples': 1556736, 'steps': 8107, 'loss/train': 2.0541205406188965} +11/06/2021 22:22:51 - INFO - __main__ - Step 8109: {'lr': 0.0004979016597290264, 'samples': 1556928, 'steps': 8108, 'loss/train': 2.090756893157959} +11/06/2021 22:22:51 - INFO - __main__ - Step 8110: {'lr': 0.0004979009735566152, 'samples': 1557120, 'steps': 8109, 'loss/train': 1.956437110900879} +11/06/2021 22:22:51 - INFO - __main__ - Step 8111: {'lr': 0.0004979002872725037, 'samples': 1557312, 'steps': 8110, 'loss/train': 0.9265539050102234} +11/06/2021 22:22:52 - INFO - __main__ - Step 8112: {'lr': 0.0004978996008766922, 'samples': 1557504, 'steps': 8111, 'loss/train': 1.8253365755081177} +11/06/2021 22:22:53 - INFO - __main__ - Step 8113: {'lr': 0.0004978989143691808, 'samples': 1557696, 'steps': 8112, 'loss/train': 2.0821549892425537} +11/06/2021 22:22:54 - INFO - __main__ - Step 8114: {'lr': 0.00049789822774997, 'samples': 1557888, 'steps': 8113, 'loss/train': 1.468117356300354} +11/06/2021 22:22:54 - INFO - __main__ - Step 8115: {'lr': 0.0004978975410190601, 'samples': 1558080, 'steps': 8114, 'loss/train': 2.1024975776672363} +11/06/2021 22:22:54 - INFO - __main__ - Step 8116: {'lr': 0.0004978968541764515, 'samples': 1558272, 'steps': 8115, 'loss/train': 2.9898436069488525} +11/06/2021 22:22:55 - INFO - __main__ - Step 8117: {'lr': 0.0004978961672221444, 'samples': 1558464, 'steps': 8116, 'loss/train': 2.3070497512817383} +11/06/2021 22:22:55 - INFO - __main__ - Step 8118: {'lr': 0.000497895480156139, 'samples': 1558656, 'steps': 8117, 'loss/train': 1.9509214162826538} +11/06/2021 22:22:56 - INFO - __main__ - Step 8119: {'lr': 0.0004978947929784358, 'samples': 1558848, 'steps': 8118, 'loss/train': 1.3840776681900024} +11/06/2021 22:22:57 - INFO - __main__ - Step 8120: {'lr': 0.0004978941056890349, 'samples': 1559040, 'steps': 8119, 'loss/train': 1.7440425157546997} +11/06/2021 22:22:57 - INFO - __main__ - Step 8121: {'lr': 0.0004978934182879369, 'samples': 1559232, 'steps': 8120, 'loss/train': 1.8195523023605347} +11/06/2021 22:22:57 - INFO - __main__ - Step 8122: {'lr': 0.0004978927307751419, 'samples': 1559424, 'steps': 8121, 'loss/train': 1.3453588485717773} +11/06/2021 22:22:58 - INFO - __main__ - Step 8123: {'lr': 0.0004978920431506501, 'samples': 1559616, 'steps': 8122, 'loss/train': 1.8378467559814453} +11/06/2021 22:22:58 - INFO - __main__ - Step 8124: {'lr': 0.0004978913554144623, 'samples': 1559808, 'steps': 8123, 'loss/train': 2.123873472213745} +11/06/2021 22:22:59 - INFO - __main__ - Step 8125: {'lr': 0.0004978906675665782, 'samples': 1560000, 'steps': 8124, 'loss/train': 2.085545063018799} +11/06/2021 22:22:59 - INFO - __main__ - Step 8126: {'lr': 0.0004978899796069985, 'samples': 1560192, 'steps': 8125, 'loss/train': 1.9374345541000366} +11/06/2021 22:23:00 - INFO - __main__ - Step 8127: {'lr': 0.0004978892915357234, 'samples': 1560384, 'steps': 8126, 'loss/train': 2.0188064575195312} +11/06/2021 22:23:00 - INFO - __main__ - Step 8128: {'lr': 0.0004978886033527532, 'samples': 1560576, 'steps': 8127, 'loss/train': 2.549909830093384} +11/06/2021 22:23:00 - INFO - __main__ - Step 8129: {'lr': 0.0004978879150580882, 'samples': 1560768, 'steps': 8128, 'loss/train': 1.8509951829910278} +11/06/2021 22:23:01 - INFO - __main__ - Step 8130: {'lr': 0.0004978872266517288, 'samples': 1560960, 'steps': 8129, 'loss/train': 1.873234748840332} +11/06/2021 22:23:02 - INFO - __main__ - Step 8131: {'lr': 0.0004978865381336752, 'samples': 1561152, 'steps': 8130, 'loss/train': 1.8826571702957153} +11/06/2021 22:23:03 - INFO - __main__ - Step 8132: {'lr': 0.0004978858495039277, 'samples': 1561344, 'steps': 8131, 'loss/train': 1.34197998046875} +11/06/2021 22:23:03 - INFO - __main__ - Step 8133: {'lr': 0.0004978851607624867, 'samples': 1561536, 'steps': 8132, 'loss/train': 3.694458484649658} +11/06/2021 22:23:03 - INFO - __main__ - Step 8134: {'lr': 0.0004978844719093525, 'samples': 1561728, 'steps': 8133, 'loss/train': 2.0985944271087646} +11/06/2021 22:23:04 - INFO - __main__ - Step 8135: {'lr': 0.0004978837829445254, 'samples': 1561920, 'steps': 8134, 'loss/train': 1.7875434160232544} +11/06/2021 22:23:04 - INFO - __main__ - Step 8136: {'lr': 0.0004978830938680056, 'samples': 1562112, 'steps': 8135, 'loss/train': 1.9818612337112427} +11/06/2021 22:23:05 - INFO - __main__ - Step 8137: {'lr': 0.0004978824046797935, 'samples': 1562304, 'steps': 8136, 'loss/train': 2.647218942642212} +11/06/2021 22:23:05 - INFO - __main__ - Step 8138: {'lr': 0.0004978817153798895, 'samples': 1562496, 'steps': 8137, 'loss/train': 1.852639079093933} +11/06/2021 22:23:06 - INFO - __main__ - Step 8139: {'lr': 0.0004978810259682939, 'samples': 1562688, 'steps': 8138, 'loss/train': 1.697789192199707} +11/06/2021 22:23:06 - INFO - __main__ - Step 8140: {'lr': 0.0004978803364450068, 'samples': 1562880, 'steps': 8139, 'loss/train': 1.768872618675232} +11/06/2021 22:23:06 - INFO - __main__ - Step 8141: {'lr': 0.0004978796468100286, 'samples': 1563072, 'steps': 8140, 'loss/train': 1.7271705865859985} +11/06/2021 22:23:07 - INFO - __main__ - Step 8142: {'lr': 0.0004978789570633598, 'samples': 1563264, 'steps': 8141, 'loss/train': 2.176313638687134} +11/06/2021 22:23:08 - INFO - __main__ - Step 8143: {'lr': 0.0004978782672050004, 'samples': 1563456, 'steps': 8142, 'loss/train': 2.180102586746216} +11/06/2021 22:23:08 - INFO - __main__ - Step 8144: {'lr': 0.000497877577234951, 'samples': 1563648, 'steps': 8143, 'loss/train': 2.109963893890381} +11/06/2021 22:23:08 - INFO - __main__ - Step 8145: {'lr': 0.0004978768871532117, 'samples': 1563840, 'steps': 8144, 'loss/train': 2.1114203929901123} +11/06/2021 22:23:09 - INFO - __main__ - Step 8146: {'lr': 0.0004978761969597831, 'samples': 1564032, 'steps': 8145, 'loss/train': 2.357698917388916} +11/06/2021 22:23:09 - INFO - __main__ - Step 8147: {'lr': 0.0004978755066546651, 'samples': 1564224, 'steps': 8146, 'loss/train': 1.9668238162994385} +11/06/2021 22:23:10 - INFO - __main__ - Step 8148: {'lr': 0.0004978748162378583, 'samples': 1564416, 'steps': 8147, 'loss/train': 1.837101936340332} +11/06/2021 22:23:11 - INFO - __main__ - Step 8149: {'lr': 0.0004978741257093629, 'samples': 1564608, 'steps': 8148, 'loss/train': 2.2903544902801514} +11/06/2021 22:23:11 - INFO - __main__ - Step 8150: {'lr': 0.0004978734350691793, 'samples': 1564800, 'steps': 8149, 'loss/train': 1.4162994623184204} +11/06/2021 22:23:11 - INFO - __main__ - Step 8151: {'lr': 0.0004978727443173077, 'samples': 1564992, 'steps': 8150, 'loss/train': 1.6277093887329102} +11/06/2021 22:23:12 - INFO - __main__ - Step 8152: {'lr': 0.0004978720534537485, 'samples': 1565184, 'steps': 8151, 'loss/train': 1.715814471244812} +11/06/2021 22:23:13 - INFO - __main__ - Step 8153: {'lr': 0.000497871362478502, 'samples': 1565376, 'steps': 8152, 'loss/train': 1.4183335304260254} +11/06/2021 22:23:13 - INFO - __main__ - Step 8154: {'lr': 0.0004978706713915684, 'samples': 1565568, 'steps': 8153, 'loss/train': 1.7779927253723145} +11/06/2021 22:23:13 - INFO - __main__ - Step 8155: {'lr': 0.0004978699801929481, 'samples': 1565760, 'steps': 8154, 'loss/train': 1.3929790258407593} +11/06/2021 22:23:14 - INFO - __main__ - Step 8156: {'lr': 0.0004978692888826415, 'samples': 1565952, 'steps': 8155, 'loss/train': 1.6693589687347412} +11/06/2021 22:23:14 - INFO - __main__ - Step 8157: {'lr': 0.0004978685974606488, 'samples': 1566144, 'steps': 8156, 'loss/train': 1.4203959703445435} +11/06/2021 22:23:15 - INFO - __main__ - Step 8158: {'lr': 0.0004978679059269704, 'samples': 1566336, 'steps': 8157, 'loss/train': 1.9157639741897583} +11/06/2021 22:23:16 - INFO - __main__ - Step 8159: {'lr': 0.0004978672142816064, 'samples': 1566528, 'steps': 8158, 'loss/train': 1.5440396070480347} +11/06/2021 22:23:16 - INFO - __main__ - Step 8160: {'lr': 0.0004978665225245573, 'samples': 1566720, 'steps': 8159, 'loss/train': 1.5769977569580078} +11/06/2021 22:23:16 - INFO - __main__ - Step 8161: {'lr': 0.0004978658306558234, 'samples': 1566912, 'steps': 8160, 'loss/train': 1.9604636430740356} +11/06/2021 22:23:17 - INFO - __main__ - Step 8162: {'lr': 0.000497865138675405, 'samples': 1567104, 'steps': 8161, 'loss/train': 1.6201629638671875} +11/06/2021 22:23:18 - INFO - __main__ - Step 8163: {'lr': 0.0004978644465833024, 'samples': 1567296, 'steps': 8162, 'loss/train': 1.5474094152450562} +11/06/2021 22:23:18 - INFO - __main__ - Step 8164: {'lr': 0.000497863754379516, 'samples': 1567488, 'steps': 8163, 'loss/train': 2.2988481521606445} +11/06/2021 22:23:18 - INFO - __main__ - Step 8165: {'lr': 0.0004978630620640458, 'samples': 1567680, 'steps': 8164, 'loss/train': 1.2239776849746704} +11/06/2021 22:23:19 - INFO - __main__ - Step 8166: {'lr': 0.0004978623696368924, 'samples': 1567872, 'steps': 8165, 'loss/train': 1.8691977262496948} +11/06/2021 22:23:19 - INFO - __main__ - Step 8167: {'lr': 0.0004978616770980561, 'samples': 1568064, 'steps': 8166, 'loss/train': 1.9919401407241821} +11/06/2021 22:23:19 - INFO - __main__ - Step 8168: {'lr': 0.0004978609844475371, 'samples': 1568256, 'steps': 8167, 'loss/train': 2.040534257888794} +11/06/2021 22:23:21 - INFO - __main__ - Step 8169: {'lr': 0.0004978602916853359, 'samples': 1568448, 'steps': 8168, 'loss/train': 1.9862347841262817} +11/06/2021 22:23:21 - INFO - __main__ - Step 8170: {'lr': 0.0004978595988114525, 'samples': 1568640, 'steps': 8169, 'loss/train': 1.8854844570159912} +11/06/2021 22:23:21 - INFO - __main__ - Step 8171: {'lr': 0.0004978589058258874, 'samples': 1568832, 'steps': 8170, 'loss/train': 1.8785438537597656} +11/06/2021 22:23:22 - INFO - __main__ - Step 8172: {'lr': 0.0004978582127286409, 'samples': 1569024, 'steps': 8171, 'loss/train': 2.3725521564483643} +11/06/2021 22:23:22 - INFO - __main__ - Step 8173: {'lr': 0.0004978575195197135, 'samples': 1569216, 'steps': 8172, 'loss/train': 2.0266950130462646} +11/06/2021 22:23:23 - INFO - __main__ - Step 8174: {'lr': 0.0004978568261991051, 'samples': 1569408, 'steps': 8173, 'loss/train': 1.6820038557052612} +11/06/2021 22:23:23 - INFO - __main__ - Step 8175: {'lr': 0.0004978561327668164, 'samples': 1569600, 'steps': 8174, 'loss/train': 1.5046055316925049} +11/06/2021 22:23:24 - INFO - __main__ - Step 8176: {'lr': 0.0004978554392228475, 'samples': 1569792, 'steps': 8175, 'loss/train': 1.718424916267395} +11/06/2021 22:23:24 - INFO - __main__ - Step 8177: {'lr': 0.0004978547455671986, 'samples': 1569984, 'steps': 8176, 'loss/train': 1.3242571353912354} +11/06/2021 22:23:24 - INFO - __main__ - Step 8178: {'lr': 0.0004978540517998704, 'samples': 1570176, 'steps': 8177, 'loss/train': 1.511248230934143} +11/06/2021 22:23:25 - INFO - __main__ - Step 8179: {'lr': 0.0004978533579208629, 'samples': 1570368, 'steps': 8178, 'loss/train': 1.66165292263031} +11/06/2021 22:23:26 - INFO - __main__ - Step 8180: {'lr': 0.0004978526639301766, 'samples': 1570560, 'steps': 8179, 'loss/train': 2.0218098163604736} +11/06/2021 22:23:26 - INFO - __main__ - Step 8181: {'lr': 0.0004978519698278116, 'samples': 1570752, 'steps': 8180, 'loss/train': 2.0883474349975586} +11/06/2021 22:23:26 - INFO - __main__ - Step 8182: {'lr': 0.0004978512756137684, 'samples': 1570944, 'steps': 8181, 'loss/train': 2.5265679359436035} +11/06/2021 22:23:27 - INFO - __main__ - Step 8183: {'lr': 0.0004978505812880472, 'samples': 1571136, 'steps': 8182, 'loss/train': 1.8759024143218994} +11/06/2021 22:23:28 - INFO - __main__ - Step 8184: {'lr': 0.0004978498868506483, 'samples': 1571328, 'steps': 8183, 'loss/train': 2.0600368976593018} +11/06/2021 22:23:28 - INFO - __main__ - Step 8185: {'lr': 0.0004978491923015721, 'samples': 1571520, 'steps': 8184, 'loss/train': 1.7194626331329346} +11/06/2021 22:23:28 - INFO - __main__ - Step 8186: {'lr': 0.0004978484976408189, 'samples': 1571712, 'steps': 8185, 'loss/train': 1.817257285118103} +11/06/2021 22:23:29 - INFO - __main__ - Step 8187: {'lr': 0.000497847802868389, 'samples': 1571904, 'steps': 8186, 'loss/train': 1.9279881715774536} +11/06/2021 22:23:29 - INFO - __main__ - Step 8188: {'lr': 0.0004978471079842827, 'samples': 1572096, 'steps': 8187, 'loss/train': 1.9306005239486694} +11/06/2021 22:23:30 - INFO - __main__ - Step 8189: {'lr': 0.0004978464129885003, 'samples': 1572288, 'steps': 8188, 'loss/train': 1.9209128618240356} +11/06/2021 22:23:31 - INFO - __main__ - Step 8190: {'lr': 0.0004978457178810422, 'samples': 1572480, 'steps': 8189, 'loss/train': 0.7898921966552734} +11/06/2021 22:23:31 - INFO - __main__ - Step 8191: {'lr': 0.0004978450226619085, 'samples': 1572672, 'steps': 8190, 'loss/train': 1.9690088033676147} +11/06/2021 22:23:31 - INFO - __main__ - Step 8192: {'lr': 0.0004978443273310997, 'samples': 1572864, 'steps': 8191, 'loss/train': 1.8891528844833374} +11/06/2021 22:23:32 - INFO - __main__ - Step 8193: {'lr': 0.0004978436318886162, 'samples': 1573056, 'steps': 8192, 'loss/train': 1.6559553146362305} +11/06/2021 22:23:32 - INFO - __main__ - Step 8194: {'lr': 0.0004978429363344581, 'samples': 1573248, 'steps': 8193, 'loss/train': 0.9482629299163818} +11/06/2021 22:23:33 - INFO - __main__ - Step 8195: {'lr': 0.0004978422406686257, 'samples': 1573440, 'steps': 8194, 'loss/train': 1.9039665460586548} +11/06/2021 22:23:33 - INFO - __main__ - Step 8196: {'lr': 0.0004978415448911196, 'samples': 1573632, 'steps': 8195, 'loss/train': 1.7499048709869385} +11/06/2021 22:23:34 - INFO - __main__ - Step 8197: {'lr': 0.0004978408490019398, 'samples': 1573824, 'steps': 8196, 'loss/train': 1.526663064956665} +11/06/2021 22:23:34 - INFO - __main__ - Step 8198: {'lr': 0.0004978401530010868, 'samples': 1574016, 'steps': 8197, 'loss/train': 2.0458552837371826} +11/06/2021 22:23:35 - INFO - __main__ - Step 8199: {'lr': 0.0004978394568885608, 'samples': 1574208, 'steps': 8198, 'loss/train': 1.7852051258087158} +11/06/2021 22:23:36 - INFO - __main__ - Step 8200: {'lr': 0.0004978387606643621, 'samples': 1574400, 'steps': 8199, 'loss/train': 1.7068928480148315} +11/06/2021 22:23:36 - INFO - __main__ - Step 8201: {'lr': 0.0004978380643284912, 'samples': 1574592, 'steps': 8200, 'loss/train': 1.7486140727996826} +11/06/2021 22:23:36 - INFO - __main__ - Step 8202: {'lr': 0.0004978373678809482, 'samples': 1574784, 'steps': 8201, 'loss/train': 6.046335220336914} +11/06/2021 22:23:37 - INFO - __main__ - Step 8203: {'lr': 0.0004978366713217336, 'samples': 1574976, 'steps': 8202, 'loss/train': 1.418635368347168} +11/06/2021 22:23:37 - INFO - __main__ - Step 8204: {'lr': 0.0004978359746508476, 'samples': 1575168, 'steps': 8203, 'loss/train': 2.039991855621338} +11/06/2021 22:23:38 - INFO - __main__ - Step 8205: {'lr': 0.0004978352778682905, 'samples': 1575360, 'steps': 8204, 'loss/train': 1.6890138387680054} +11/06/2021 22:23:38 - INFO - __main__ - Step 8206: {'lr': 0.0004978345809740626, 'samples': 1575552, 'steps': 8205, 'loss/train': 1.5831921100616455} +11/06/2021 22:23:39 - INFO - __main__ - Step 8207: {'lr': 0.0004978338839681644, 'samples': 1575744, 'steps': 8206, 'loss/train': 1.284598469734192} +11/06/2021 22:23:39 - INFO - __main__ - Step 8208: {'lr': 0.000497833186850596, 'samples': 1575936, 'steps': 8207, 'loss/train': 1.9825032949447632} +11/06/2021 22:23:39 - INFO - __main__ - Step 8209: {'lr': 0.0004978324896213577, 'samples': 1576128, 'steps': 8208, 'loss/train': 1.068908929824829} +11/06/2021 22:23:40 - INFO - __main__ - Step 8210: {'lr': 0.00049783179228045, 'samples': 1576320, 'steps': 8209, 'loss/train': 2.0612127780914307} +11/06/2021 22:23:41 - INFO - __main__ - Step 8211: {'lr': 0.0004978310948278731, 'samples': 1576512, 'steps': 8210, 'loss/train': 1.5374093055725098} +11/06/2021 22:23:41 - INFO - __main__ - Step 8212: {'lr': 0.0004978303972636275, 'samples': 1576704, 'steps': 8211, 'loss/train': 1.6517690420150757} +11/06/2021 22:23:41 - INFO - __main__ - Step 8213: {'lr': 0.0004978296995877132, 'samples': 1576896, 'steps': 8212, 'loss/train': 1.9710806608200073} +11/06/2021 22:23:42 - INFO - __main__ - Step 8214: {'lr': 0.0004978290018001306, 'samples': 1577088, 'steps': 8213, 'loss/train': 1.794217824935913} +11/06/2021 22:23:42 - INFO - __main__ - Step 8215: {'lr': 0.0004978283039008801, 'samples': 1577280, 'steps': 8214, 'loss/train': 2.031745433807373} +11/06/2021 22:23:43 - INFO - __main__ - Step 8216: {'lr': 0.000497827605889962, 'samples': 1577472, 'steps': 8215, 'loss/train': 1.8105554580688477} +11/06/2021 22:23:44 - INFO - __main__ - Step 8217: {'lr': 0.0004978269077673766, 'samples': 1577664, 'steps': 8216, 'loss/train': 1.3719156980514526} +11/06/2021 22:23:44 - INFO - __main__ - Step 8218: {'lr': 0.0004978262095331243, 'samples': 1577856, 'steps': 8217, 'loss/train': 1.7575129270553589} +11/06/2021 22:23:44 - INFO - __main__ - Step 8219: {'lr': 0.0004978255111872053, 'samples': 1578048, 'steps': 8218, 'loss/train': 1.9451090097427368} +11/06/2021 22:23:45 - INFO - __main__ - Step 8220: {'lr': 0.0004978248127296198, 'samples': 1578240, 'steps': 8219, 'loss/train': 2.2303905487060547} +11/06/2021 22:23:46 - INFO - __main__ - Step 8221: {'lr': 0.0004978241141603685, 'samples': 1578432, 'steps': 8220, 'loss/train': 2.1511523723602295} +11/06/2021 22:23:46 - INFO - __main__ - Step 8222: {'lr': 0.0004978234154794514, 'samples': 1578624, 'steps': 8221, 'loss/train': 1.9754325151443481} +11/06/2021 22:23:46 - INFO - __main__ - Step 8223: {'lr': 0.0004978227166868689, 'samples': 1578816, 'steps': 8222, 'loss/train': 1.4744144678115845} +11/06/2021 22:23:47 - INFO - __main__ - Step 8224: {'lr': 0.0004978220177826212, 'samples': 1579008, 'steps': 8223, 'loss/train': 1.977313756942749} +11/06/2021 22:23:47 - INFO - __main__ - Step 8225: {'lr': 0.0004978213187667087, 'samples': 1579200, 'steps': 8224, 'loss/train': 1.9514577388763428} +11/06/2021 22:23:48 - INFO - __main__ - Step 8226: {'lr': 0.0004978206196391319, 'samples': 1579392, 'steps': 8225, 'loss/train': 1.6040639877319336} +11/06/2021 22:23:48 - INFO - __main__ - Step 8227: {'lr': 0.0004978199203998909, 'samples': 1579584, 'steps': 8226, 'loss/train': 2.2450778484344482} +11/06/2021 22:23:49 - INFO - __main__ - Step 8228: {'lr': 0.0004978192210489861, 'samples': 1579776, 'steps': 8227, 'loss/train': 1.8342416286468506} +11/06/2021 22:23:49 - INFO - __main__ - Step 8229: {'lr': 0.0004978185215864177, 'samples': 1579968, 'steps': 8228, 'loss/train': 1.8177608251571655} +11/06/2021 22:23:50 - INFO - __main__ - Step 8230: {'lr': 0.0004978178220121862, 'samples': 1580160, 'steps': 8229, 'loss/train': 1.1857390403747559} +11/06/2021 22:23:50 - INFO - __main__ - Step 8231: {'lr': 0.0004978171223262917, 'samples': 1580352, 'steps': 8230, 'loss/train': 1.4002374410629272} +11/06/2021 22:23:51 - INFO - __main__ - Step 8232: {'lr': 0.0004978164225287346, 'samples': 1580544, 'steps': 8231, 'loss/train': 1.7684195041656494} +11/06/2021 22:23:51 - INFO - __main__ - Step 8233: {'lr': 0.0004978157226195153, 'samples': 1580736, 'steps': 8232, 'loss/train': 1.4781603813171387} +11/06/2021 22:23:52 - INFO - __main__ - Step 8234: {'lr': 0.0004978150225986342, 'samples': 1580928, 'steps': 8233, 'loss/train': 1.919776439666748} +11/06/2021 22:23:52 - INFO - __main__ - Step 8235: {'lr': 0.0004978143224660913, 'samples': 1581120, 'steps': 8234, 'loss/train': 2.3026692867279053} +11/06/2021 22:23:52 - INFO - __main__ - Step 8236: {'lr': 0.0004978136222218872, 'samples': 1581312, 'steps': 8235, 'loss/train': 1.9693598747253418} +11/06/2021 22:23:53 - INFO - __main__ - Step 8237: {'lr': 0.000497812921866022, 'samples': 1581504, 'steps': 8236, 'loss/train': 2.0580477714538574} +11/06/2021 22:23:54 - INFO - __main__ - Step 8238: {'lr': 0.0004978122213984961, 'samples': 1581696, 'steps': 8237, 'loss/train': 1.808411955833435} +11/06/2021 22:23:54 - INFO - __main__ - Step 8239: {'lr': 0.00049781152081931, 'samples': 1581888, 'steps': 8238, 'loss/train': 1.9752439260482788} +11/06/2021 22:23:54 - INFO - __main__ - Step 8240: {'lr': 0.0004978108201284638, 'samples': 1582080, 'steps': 8239, 'loss/train': 0.9977089166641235} +11/06/2021 22:23:55 - INFO - __main__ - Step 8241: {'lr': 0.0004978101193259578, 'samples': 1582272, 'steps': 8240, 'loss/train': 0.3795441687107086} +11/06/2021 22:23:56 - INFO - __main__ - Step 8242: {'lr': 0.0004978094184117924, 'samples': 1582464, 'steps': 8241, 'loss/train': 1.8929859399795532} +11/06/2021 22:23:56 - INFO - __main__ - Step 8243: {'lr': 0.0004978087173859679, 'samples': 1582656, 'steps': 8242, 'loss/train': 1.606785774230957} +11/06/2021 22:23:56 - INFO - __main__ - Step 8244: {'lr': 0.0004978080162484846, 'samples': 1582848, 'steps': 8243, 'loss/train': 2.046319007873535} +11/06/2021 22:23:57 - INFO - __main__ - Step 8245: {'lr': 0.000497807314999343, 'samples': 1583040, 'steps': 8244, 'loss/train': 1.9589273929595947} +11/06/2021 22:23:57 - INFO - __main__ - Step 8246: {'lr': 0.000497806613638543, 'samples': 1583232, 'steps': 8245, 'loss/train': 1.904953956604004} +11/06/2021 22:23:58 - INFO - __main__ - Step 8247: {'lr': 0.0004978059121660853, 'samples': 1583424, 'steps': 8246, 'loss/train': 1.978081226348877} +11/06/2021 22:23:59 - INFO - __main__ - Step 8248: {'lr': 0.0004978052105819701, 'samples': 1583616, 'steps': 8247, 'loss/train': 2.0313427448272705} +11/06/2021 22:23:59 - INFO - __main__ - Step 8249: {'lr': 0.0004978045088861976, 'samples': 1583808, 'steps': 8248, 'loss/train': 2.3198392391204834} +11/06/2021 22:23:59 - INFO - __main__ - Step 8250: {'lr': 0.0004978038070787683, 'samples': 1584000, 'steps': 8249, 'loss/train': 2.009343147277832} +11/06/2021 22:24:00 - INFO - __main__ - Step 8251: {'lr': 0.0004978031051596824, 'samples': 1584192, 'steps': 8250, 'loss/train': 1.775676965713501} +11/06/2021 22:24:01 - INFO - __main__ - Step 8252: {'lr': 0.0004978024031289402, 'samples': 1584384, 'steps': 8251, 'loss/train': 1.8589789867401123} +11/06/2021 22:24:01 - INFO - __main__ - Step 8253: {'lr': 0.0004978017009865421, 'samples': 1584576, 'steps': 8252, 'loss/train': 1.619974970817566} +11/06/2021 22:24:01 - INFO - __main__ - Step 8254: {'lr': 0.0004978009987324884, 'samples': 1584768, 'steps': 8253, 'loss/train': 1.9142787456512451} +11/06/2021 22:24:02 - INFO - __main__ - Step 8255: {'lr': 0.0004978002963667794, 'samples': 1584960, 'steps': 8254, 'loss/train': 1.2939250469207764} +11/06/2021 22:24:02 - INFO - __main__ - Step 8256: {'lr': 0.0004977995938894153, 'samples': 1585152, 'steps': 8255, 'loss/train': 2.2025363445281982} +11/06/2021 22:24:03 - INFO - __main__ - Step 8257: {'lr': 0.0004977988913003966, 'samples': 1585344, 'steps': 8256, 'loss/train': 2.0969882011413574} +11/06/2021 22:24:03 - INFO - __main__ - Step 8258: {'lr': 0.0004977981885997235, 'samples': 1585536, 'steps': 8257, 'loss/train': 1.3908742666244507} +11/06/2021 22:24:04 - INFO - __main__ - Step 8259: {'lr': 0.0004977974857873964, 'samples': 1585728, 'steps': 8258, 'loss/train': 1.7966902256011963} +11/06/2021 22:24:04 - INFO - __main__ - Step 8260: {'lr': 0.0004977967828634157, 'samples': 1585920, 'steps': 8259, 'loss/train': 1.8227860927581787} +11/06/2021 22:24:05 - INFO - __main__ - Step 8261: {'lr': 0.0004977960798277814, 'samples': 1586112, 'steps': 8260, 'loss/train': 1.9070138931274414} +11/06/2021 22:24:05 - INFO - __main__ - Step 8262: {'lr': 0.0004977953766804941, 'samples': 1586304, 'steps': 8261, 'loss/train': 1.7750216722488403} +11/06/2021 22:24:06 - INFO - __main__ - Step 8263: {'lr': 0.0004977946734215541, 'samples': 1586496, 'steps': 8262, 'loss/train': 1.3663748502731323} +11/06/2021 22:24:06 - INFO - __main__ - Step 8264: {'lr': 0.0004977939700509615, 'samples': 1586688, 'steps': 8263, 'loss/train': 2.318755626678467} +11/06/2021 22:24:07 - INFO - __main__ - Step 8265: {'lr': 0.0004977932665687168, 'samples': 1586880, 'steps': 8264, 'loss/train': 1.6168603897094727} +11/06/2021 22:24:07 - INFO - __main__ - Step 8266: {'lr': 0.0004977925629748203, 'samples': 1587072, 'steps': 8265, 'loss/train': 1.8348907232284546} +11/06/2021 22:24:07 - INFO - __main__ - Step 8267: {'lr': 0.0004977918592692723, 'samples': 1587264, 'steps': 8266, 'loss/train': 2.0127944946289062} +11/06/2021 22:24:08 - INFO - __main__ - Step 8268: {'lr': 0.0004977911554520731, 'samples': 1587456, 'steps': 8267, 'loss/train': 2.4717700481414795} +11/06/2021 22:24:09 - INFO - __main__ - Step 8269: {'lr': 0.000497790451523223, 'samples': 1587648, 'steps': 8268, 'loss/train': 1.848479151725769} +11/06/2021 22:24:09 - INFO - __main__ - Step 8270: {'lr': 0.0004977897474827224, 'samples': 1587840, 'steps': 8269, 'loss/train': 2.058631420135498} +11/06/2021 22:24:09 - INFO - __main__ - Step 8271: {'lr': 0.0004977890433305716, 'samples': 1588032, 'steps': 8270, 'loss/train': 2.1743407249450684} +11/06/2021 22:24:10 - INFO - __main__ - Step 8272: {'lr': 0.0004977883390667707, 'samples': 1588224, 'steps': 8271, 'loss/train': 1.7695982456207275} +11/06/2021 22:24:11 - INFO - __main__ - Step 8273: {'lr': 0.0004977876346913204, 'samples': 1588416, 'steps': 8272, 'loss/train': 1.5789722204208374} +11/06/2021 22:24:11 - INFO - __main__ - Step 8274: {'lr': 0.0004977869302042207, 'samples': 1588608, 'steps': 8273, 'loss/train': 1.8004614114761353} +11/06/2021 22:24:12 - INFO - __main__ - Step 8275: {'lr': 0.0004977862256054721, 'samples': 1588800, 'steps': 8274, 'loss/train': 1.8264741897583008} +11/06/2021 22:24:12 - INFO - __main__ - Step 8276: {'lr': 0.0004977855208950748, 'samples': 1588992, 'steps': 8275, 'loss/train': 1.8771971464157104} +11/06/2021 22:24:12 - INFO - __main__ - Step 8277: {'lr': 0.0004977848160730292, 'samples': 1589184, 'steps': 8276, 'loss/train': 1.6610857248306274} +11/06/2021 22:24:13 - INFO - __main__ - Step 8278: {'lr': 0.0004977841111393356, 'samples': 1589376, 'steps': 8277, 'loss/train': 1.7846906185150146} +11/06/2021 22:24:14 - INFO - __main__ - Step 8279: {'lr': 0.0004977834060939943, 'samples': 1589568, 'steps': 8278, 'loss/train': 1.6243547201156616} +11/06/2021 22:24:14 - INFO - __main__ - Step 8280: {'lr': 0.0004977827009370056, 'samples': 1589760, 'steps': 8279, 'loss/train': 1.42178475856781} +11/06/2021 22:24:14 - INFO - __main__ - Step 8281: {'lr': 0.0004977819956683698, 'samples': 1589952, 'steps': 8280, 'loss/train': 1.8669449090957642} +11/06/2021 22:24:15 - INFO - __main__ - Step 8282: {'lr': 0.0004977812902880873, 'samples': 1590144, 'steps': 8281, 'loss/train': 2.0661544799804688} +11/06/2021 22:24:15 - INFO - __main__ - Step 8283: {'lr': 0.0004977805847961584, 'samples': 1590336, 'steps': 8282, 'loss/train': 1.9494577646255493} +11/06/2021 22:24:16 - INFO - __main__ - Step 8284: {'lr': 0.0004977798791925834, 'samples': 1590528, 'steps': 8283, 'loss/train': 1.9344879388809204} +11/06/2021 22:24:16 - INFO - __main__ - Step 8285: {'lr': 0.0004977791734773624, 'samples': 1590720, 'steps': 8284, 'loss/train': 1.7498496770858765} +11/06/2021 22:24:17 - INFO - __main__ - Step 8286: {'lr': 0.0004977784676504962, 'samples': 1590912, 'steps': 8285, 'loss/train': 1.4974678754806519} +11/06/2021 22:24:17 - INFO - __main__ - Step 8287: {'lr': 0.0004977777617119847, 'samples': 1591104, 'steps': 8286, 'loss/train': 1.8675819635391235} +11/06/2021 22:24:18 - INFO - __main__ - Step 8288: {'lr': 0.0004977770556618284, 'samples': 1591296, 'steps': 8287, 'loss/train': 2.119424343109131} +11/06/2021 22:24:18 - INFO - __main__ - Step 8289: {'lr': 0.0004977763495000276, 'samples': 1591488, 'steps': 8288, 'loss/train': 1.7665525674819946} +11/06/2021 22:24:19 - INFO - __main__ - Step 8290: {'lr': 0.0004977756432265827, 'samples': 1591680, 'steps': 8289, 'loss/train': 1.5919955968856812} +11/06/2021 22:24:19 - INFO - __main__ - Step 8291: {'lr': 0.0004977749368414937, 'samples': 1591872, 'steps': 8290, 'loss/train': 1.6842032670974731} +11/06/2021 22:24:20 - INFO - __main__ - Step 8292: {'lr': 0.0004977742303447613, 'samples': 1592064, 'steps': 8291, 'loss/train': 2.4035115242004395} +11/06/2021 22:24:20 - INFO - __main__ - Step 8293: {'lr': 0.0004977735237363855, 'samples': 1592256, 'steps': 8292, 'loss/train': 1.7982686758041382} +11/06/2021 22:24:21 - INFO - __main__ - Step 8294: {'lr': 0.0004977728170163669, 'samples': 1592448, 'steps': 8293, 'loss/train': 2.0274014472961426} +11/06/2021 22:24:21 - INFO - __main__ - Step 8295: {'lr': 0.0004977721101847057, 'samples': 1592640, 'steps': 8294, 'loss/train': 2.058189868927002} +11/06/2021 22:24:22 - INFO - __main__ - Step 8296: {'lr': 0.0004977714032414021, 'samples': 1592832, 'steps': 8295, 'loss/train': 1.709094762802124} +11/06/2021 22:24:22 - INFO - __main__ - Step 8297: {'lr': 0.0004977706961864566, 'samples': 1593024, 'steps': 8296, 'loss/train': 2.004429578781128} +11/06/2021 22:24:22 - INFO - __main__ - Step 8298: {'lr': 0.0004977699890198695, 'samples': 1593216, 'steps': 8297, 'loss/train': 0.9048164486885071} +11/06/2021 22:24:23 - INFO - __main__ - Step 8299: {'lr': 0.0004977692817416411, 'samples': 1593408, 'steps': 8298, 'loss/train': 1.415739893913269} +11/06/2021 22:24:24 - INFO - __main__ - Step 8300: {'lr': 0.0004977685743517715, 'samples': 1593600, 'steps': 8299, 'loss/train': 1.8536925315856934} +11/06/2021 22:24:24 - INFO - __main__ - Step 8301: {'lr': 0.0004977678668502614, 'samples': 1593792, 'steps': 8300, 'loss/train': 2.0791187286376953} +11/06/2021 22:24:24 - INFO - __main__ - Step 8302: {'lr': 0.0004977671592371108, 'samples': 1593984, 'steps': 8301, 'loss/train': 0.7785729765892029} +11/06/2021 22:24:25 - INFO - __main__ - Step 8303: {'lr': 0.0004977664515123201, 'samples': 1594176, 'steps': 8302, 'loss/train': 1.8622348308563232} +11/06/2021 22:24:26 - INFO - __main__ - Step 8304: {'lr': 0.0004977657436758898, 'samples': 1594368, 'steps': 8303, 'loss/train': 1.9687023162841797} +11/06/2021 22:24:26 - INFO - __main__ - Step 8305: {'lr': 0.00049776503572782, 'samples': 1594560, 'steps': 8304, 'loss/train': 1.782356858253479} +11/06/2021 22:24:27 - INFO - __main__ - Step 8306: {'lr': 0.0004977643276681111, 'samples': 1594752, 'steps': 8305, 'loss/train': 1.6314135789871216} +11/06/2021 22:24:27 - INFO - __main__ - Step 8307: {'lr': 0.0004977636194967634, 'samples': 1594944, 'steps': 8306, 'loss/train': 2.114375591278076} +11/06/2021 22:24:27 - INFO - __main__ - Step 8308: {'lr': 0.0004977629112137773, 'samples': 1595136, 'steps': 8307, 'loss/train': 1.4448978900909424} +11/06/2021 22:24:28 - INFO - __main__ - Step 8309: {'lr': 0.000497762202819153, 'samples': 1595328, 'steps': 8308, 'loss/train': 2.2745602130889893} +11/06/2021 22:24:29 - INFO - __main__ - Step 8310: {'lr': 0.0004977614943128909, 'samples': 1595520, 'steps': 8309, 'loss/train': 2.14582896232605} +11/06/2021 22:24:29 - INFO - __main__ - Step 8311: {'lr': 0.0004977607856949913, 'samples': 1595712, 'steps': 8310, 'loss/train': 1.7548679113388062} +11/06/2021 22:24:29 - INFO - __main__ - Step 8312: {'lr': 0.0004977600769654545, 'samples': 1595904, 'steps': 8311, 'loss/train': 1.5743494033813477} +11/06/2021 22:24:30 - INFO - __main__ - Step 8313: {'lr': 0.0004977593681242808, 'samples': 1596096, 'steps': 8312, 'loss/train': 2.279632806777954} +11/06/2021 22:24:30 - INFO - __main__ - Step 8314: {'lr': 0.0004977586591714706, 'samples': 1596288, 'steps': 8313, 'loss/train': 2.477036714553833} +11/06/2021 22:24:31 - INFO - __main__ - Step 8315: {'lr': 0.0004977579501070241, 'samples': 1596480, 'steps': 8314, 'loss/train': 1.5748059749603271} +11/06/2021 22:24:31 - INFO - __main__ - Step 8316: {'lr': 0.0004977572409309418, 'samples': 1596672, 'steps': 8315, 'loss/train': 1.7749756574630737} +11/06/2021 22:24:32 - INFO - __main__ - Step 8317: {'lr': 0.0004977565316432238, 'samples': 1596864, 'steps': 8316, 'loss/train': 2.0671162605285645} +11/06/2021 22:24:32 - INFO - __main__ - Step 8318: {'lr': 0.0004977558222438707, 'samples': 1597056, 'steps': 8317, 'loss/train': 1.9523950815200806} +11/06/2021 22:24:33 - INFO - __main__ - Step 8319: {'lr': 0.0004977551127328824, 'samples': 1597248, 'steps': 8318, 'loss/train': 1.767422080039978} +11/06/2021 22:24:34 - INFO - __main__ - Step 8320: {'lr': 0.0004977544031102597, 'samples': 1597440, 'steps': 8319, 'loss/train': 1.7613978385925293} +11/06/2021 22:24:34 - INFO - __main__ - Step 8321: {'lr': 0.0004977536933760025, 'samples': 1597632, 'steps': 8320, 'loss/train': 1.8801629543304443} +11/06/2021 22:24:34 - INFO - __main__ - Step 8322: {'lr': 0.0004977529835301115, 'samples': 1597824, 'steps': 8321, 'loss/train': 1.653210163116455} +11/06/2021 22:24:35 - INFO - __main__ - Step 8323: {'lr': 0.0004977522735725866, 'samples': 1598016, 'steps': 8322, 'loss/train': 1.4604030847549438} +11/06/2021 22:24:35 - INFO - __main__ - Step 8324: {'lr': 0.0004977515635034285, 'samples': 1598208, 'steps': 8323, 'loss/train': 1.7190172672271729} +11/06/2021 22:24:36 - INFO - __main__ - Step 8325: {'lr': 0.0004977508533226374, 'samples': 1598400, 'steps': 8324, 'loss/train': 1.7144981622695923} +11/06/2021 22:24:36 - INFO - __main__ - Step 8326: {'lr': 0.0004977501430302136, 'samples': 1598592, 'steps': 8325, 'loss/train': 2.134070873260498} +11/06/2021 22:24:37 - INFO - __main__ - Step 8327: {'lr': 0.0004977494326261573, 'samples': 1598784, 'steps': 8326, 'loss/train': 2.0011684894561768} +11/06/2021 22:24:37 - INFO - __main__ - Step 8328: {'lr': 0.000497748722110469, 'samples': 1598976, 'steps': 8327, 'loss/train': 3.0373826026916504} +11/06/2021 22:24:38 - INFO - __main__ - Step 8329: {'lr': 0.0004977480114831489, 'samples': 1599168, 'steps': 8328, 'loss/train': 1.5927302837371826} +11/06/2021 22:24:38 - INFO - __main__ - Step 8330: {'lr': 0.0004977473007441973, 'samples': 1599360, 'steps': 8329, 'loss/train': 1.6622514724731445} +11/06/2021 22:24:39 - INFO - __main__ - Step 8331: {'lr': 0.0004977465898936147, 'samples': 1599552, 'steps': 8330, 'loss/train': 2.2087743282318115} +11/06/2021 22:24:39 - INFO - __main__ - Step 8332: {'lr': 0.0004977458789314014, 'samples': 1599744, 'steps': 8331, 'loss/train': 2.013927936553955} +11/06/2021 22:24:40 - INFO - __main__ - Step 8333: {'lr': 0.0004977451678575575, 'samples': 1599936, 'steps': 8332, 'loss/train': 1.207032561302185} +11/06/2021 22:24:40 - INFO - __main__ - Step 8334: {'lr': 0.0004977444566720834, 'samples': 1600128, 'steps': 8333, 'loss/train': 1.9208728075027466} +11/06/2021 22:24:40 - INFO - __main__ - Step 8335: {'lr': 0.0004977437453749795, 'samples': 1600320, 'steps': 8334, 'loss/train': 1.8534126281738281} +11/06/2021 22:24:42 - INFO - __main__ - Step 8336: {'lr': 0.0004977430339662462, 'samples': 1600512, 'steps': 8335, 'loss/train': 2.3053481578826904} +11/06/2021 22:24:42 - INFO - __main__ - Step 8337: {'lr': 0.0004977423224458837, 'samples': 1600704, 'steps': 8336, 'loss/train': 1.7347732782363892} +11/06/2021 22:24:42 - INFO - __main__ - Step 8338: {'lr': 0.0004977416108138922, 'samples': 1600896, 'steps': 8337, 'loss/train': 1.3853802680969238} +11/06/2021 22:24:43 - INFO - __main__ - Step 8339: {'lr': 0.0004977408990702722, 'samples': 1601088, 'steps': 8338, 'loss/train': 1.826993465423584} +11/06/2021 22:24:43 - INFO - __main__ - Step 8340: {'lr': 0.0004977401872150241, 'samples': 1601280, 'steps': 8339, 'loss/train': 1.857647180557251} +11/06/2021 22:24:44 - INFO - __main__ - Step 8341: {'lr': 0.000497739475248148, 'samples': 1601472, 'steps': 8340, 'loss/train': 1.9734106063842773} +11/06/2021 22:24:44 - INFO - __main__ - Step 8342: {'lr': 0.0004977387631696443, 'samples': 1601664, 'steps': 8341, 'loss/train': 1.5935910940170288} +11/06/2021 22:24:45 - INFO - __main__ - Step 8343: {'lr': 0.0004977380509795133, 'samples': 1601856, 'steps': 8342, 'loss/train': 1.8237578868865967} +11/06/2021 22:24:45 - INFO - __main__ - Step 8344: {'lr': 0.0004977373386777554, 'samples': 1602048, 'steps': 8343, 'loss/train': 2.0518319606781006} +11/06/2021 22:24:45 - INFO - __main__ - Step 8345: {'lr': 0.0004977366262643709, 'samples': 1602240, 'steps': 8344, 'loss/train': 2.2713077068328857} +11/06/2021 22:24:46 - INFO - __main__ - Step 8346: {'lr': 0.0004977359137393601, 'samples': 1602432, 'steps': 8345, 'loss/train': 1.824563980102539} +11/06/2021 22:24:47 - INFO - __main__ - Step 8347: {'lr': 0.0004977352011027233, 'samples': 1602624, 'steps': 8346, 'loss/train': 2.087007999420166} +11/06/2021 22:24:47 - INFO - __main__ - Step 8348: {'lr': 0.0004977344883544608, 'samples': 1602816, 'steps': 8347, 'loss/train': 1.990113615989685} +11/06/2021 22:24:47 - INFO - __main__ - Step 8349: {'lr': 0.0004977337754945731, 'samples': 1603008, 'steps': 8348, 'loss/train': 1.9418188333511353} +11/06/2021 22:24:48 - INFO - __main__ - Step 8350: {'lr': 0.0004977330625230603, 'samples': 1603200, 'steps': 8349, 'loss/train': 1.706646203994751} +11/06/2021 22:24:49 - INFO - __main__ - Step 8351: {'lr': 0.0004977323494399227, 'samples': 1603392, 'steps': 8350, 'loss/train': 2.1837000846862793} +11/06/2021 22:24:49 - INFO - __main__ - Step 8352: {'lr': 0.0004977316362451608, 'samples': 1603584, 'steps': 8351, 'loss/train': 1.3790884017944336} +11/06/2021 22:24:50 - INFO - __main__ - Step 8353: {'lr': 0.0004977309229387749, 'samples': 1603776, 'steps': 8352, 'loss/train': 2.0610451698303223} +11/06/2021 22:24:50 - INFO - __main__ - Step 8354: {'lr': 0.0004977302095207653, 'samples': 1603968, 'steps': 8353, 'loss/train': 1.990189552307129} +11/06/2021 22:24:50 - INFO - __main__ - Step 8355: {'lr': 0.0004977294959911322, 'samples': 1604160, 'steps': 8354, 'loss/train': 1.6748875379562378} +11/06/2021 22:24:51 - INFO - __main__ - Step 8356: {'lr': 0.0004977287823498761, 'samples': 1604352, 'steps': 8355, 'loss/train': 2.276111602783203} +11/06/2021 22:24:52 - INFO - __main__ - Step 8357: {'lr': 0.0004977280685969971, 'samples': 1604544, 'steps': 8356, 'loss/train': 2.2838523387908936} +11/06/2021 22:24:52 - INFO - __main__ - Step 8358: {'lr': 0.0004977273547324958, 'samples': 1604736, 'steps': 8357, 'loss/train': 2.2760424613952637} +11/06/2021 22:24:52 - INFO - __main__ - Step 8359: {'lr': 0.0004977266407563722, 'samples': 1604928, 'steps': 8358, 'loss/train': 3.90104079246521} +11/06/2021 22:24:53 - INFO - __main__ - Step 8360: {'lr': 0.0004977259266686269, 'samples': 1605120, 'steps': 8359, 'loss/train': 1.3751955032348633} +11/06/2021 22:24:54 - INFO - __main__ - Step 8361: {'lr': 0.0004977252124692601, 'samples': 1605312, 'steps': 8360, 'loss/train': 1.8619705438613892} +11/06/2021 22:24:54 - INFO - __main__ - Step 8362: {'lr': 0.0004977244981582723, 'samples': 1605504, 'steps': 8361, 'loss/train': 1.7409098148345947} +11/06/2021 22:24:54 - INFO - __main__ - Step 8363: {'lr': 0.0004977237837356634, 'samples': 1605696, 'steps': 8362, 'loss/train': 1.7340418100357056} +11/06/2021 22:24:55 - INFO - __main__ - Step 8364: {'lr': 0.0004977230692014341, 'samples': 1605888, 'steps': 8363, 'loss/train': 1.5807855129241943} +11/06/2021 22:24:55 - INFO - __main__ - Step 8365: {'lr': 0.0004977223545555847, 'samples': 1606080, 'steps': 8364, 'loss/train': 1.9046440124511719} +11/06/2021 22:24:56 - INFO - __main__ - Step 8366: {'lr': 0.0004977216397981153, 'samples': 1606272, 'steps': 8365, 'loss/train': 1.9120842218399048} +11/06/2021 22:24:56 - INFO - __main__ - Step 8367: {'lr': 0.0004977209249290264, 'samples': 1606464, 'steps': 8366, 'loss/train': 1.9572821855545044} +11/06/2021 22:24:57 - INFO - __main__ - Step 8368: {'lr': 0.0004977202099483184, 'samples': 1606656, 'steps': 8367, 'loss/train': 2.009401559829712} +11/06/2021 22:24:57 - INFO - __main__ - Step 8369: {'lr': 0.0004977194948559913, 'samples': 1606848, 'steps': 8368, 'loss/train': 1.6611480712890625} +11/06/2021 22:24:58 - INFO - __main__ - Step 8370: {'lr': 0.0004977187796520457, 'samples': 1607040, 'steps': 8369, 'loss/train': 1.6625375747680664} +11/06/2021 22:24:58 - INFO - __main__ - Step 8371: {'lr': 0.0004977180643364819, 'samples': 1607232, 'steps': 8370, 'loss/train': 1.967087984085083} +11/06/2021 22:24:59 - INFO - __main__ - Step 8372: {'lr': 0.0004977173489093, 'samples': 1607424, 'steps': 8371, 'loss/train': 1.945002555847168} +11/06/2021 22:24:59 - INFO - __main__ - Step 8373: {'lr': 0.0004977166333705005, 'samples': 1607616, 'steps': 8372, 'loss/train': 1.0230144262313843} +11/06/2021 22:25:00 - INFO - __main__ - Step 8374: {'lr': 0.0004977159177200839, 'samples': 1607808, 'steps': 8373, 'loss/train': 1.9832271337509155} +11/06/2021 22:25:00 - INFO - __main__ - Step 8375: {'lr': 0.0004977152019580502, 'samples': 1608000, 'steps': 8374, 'loss/train': 1.5450023412704468} +11/06/2021 22:25:00 - INFO - __main__ - Step 8376: {'lr': 0.0004977144860843998, 'samples': 1608192, 'steps': 8375, 'loss/train': 1.7388193607330322} +11/06/2021 22:25:01 - INFO - __main__ - Step 8377: {'lr': 0.0004977137700991332, 'samples': 1608384, 'steps': 8376, 'loss/train': 1.4530218839645386} +11/06/2021 22:25:02 - INFO - __main__ - Step 8378: {'lr': 0.0004977130540022506, 'samples': 1608576, 'steps': 8377, 'loss/train': 1.5566548109054565} +11/06/2021 22:25:02 - INFO - __main__ - Step 8379: {'lr': 0.0004977123377937523, 'samples': 1608768, 'steps': 8378, 'loss/train': 1.7430671453475952} +11/06/2021 22:25:02 - INFO - __main__ - Step 8380: {'lr': 0.0004977116214736385, 'samples': 1608960, 'steps': 8379, 'loss/train': 1.1904152631759644} +11/06/2021 22:25:03 - INFO - __main__ - Step 8381: {'lr': 0.0004977109050419097, 'samples': 1609152, 'steps': 8380, 'loss/train': 2.402639150619507} +11/06/2021 22:25:04 - INFO - __main__ - Step 8382: {'lr': 0.0004977101884985663, 'samples': 1609344, 'steps': 8381, 'loss/train': 1.059557557106018} +11/06/2021 22:25:04 - INFO - __main__ - Step 8383: {'lr': 0.0004977094718436085, 'samples': 1609536, 'steps': 8382, 'loss/train': 1.9162335395812988} +11/06/2021 22:25:04 - INFO - __main__ - Step 8384: {'lr': 0.0004977087550770366, 'samples': 1609728, 'steps': 8383, 'loss/train': 1.9313476085662842} +11/06/2021 22:25:05 - INFO - __main__ - Step 8385: {'lr': 0.000497708038198851, 'samples': 1609920, 'steps': 8384, 'loss/train': 1.6063017845153809} +11/06/2021 22:25:05 - INFO - __main__ - Step 8386: {'lr': 0.0004977073212090519, 'samples': 1610112, 'steps': 8385, 'loss/train': 1.8818663358688354} +11/06/2021 22:25:06 - INFO - __main__ - Step 8387: {'lr': 0.0004977066041076398, 'samples': 1610304, 'steps': 8386, 'loss/train': 1.9069045782089233} +11/06/2021 22:25:06 - INFO - __main__ - Step 8388: {'lr': 0.0004977058868946148, 'samples': 1610496, 'steps': 8387, 'loss/train': 2.062808036804199} +11/06/2021 22:25:07 - INFO - __main__ - Step 8389: {'lr': 0.0004977051695699775, 'samples': 1610688, 'steps': 8388, 'loss/train': 1.8666964769363403} +11/06/2021 22:25:07 - INFO - __main__ - Step 8390: {'lr': 0.000497704452133728, 'samples': 1610880, 'steps': 8389, 'loss/train': 2.0732336044311523} +11/06/2021 22:25:08 - INFO - __main__ - Step 8391: {'lr': 0.0004977037345858667, 'samples': 1611072, 'steps': 8390, 'loss/train': 2.5039222240448} +11/06/2021 22:25:09 - INFO - __main__ - Step 8392: {'lr': 0.0004977030169263938, 'samples': 1611264, 'steps': 8391, 'loss/train': 1.8938769102096558} +11/06/2021 22:25:09 - INFO - __main__ - Step 8393: {'lr': 0.0004977022991553099, 'samples': 1611456, 'steps': 8392, 'loss/train': 1.8383945226669312} +11/06/2021 22:25:09 - INFO - __main__ - Step 8394: {'lr': 0.0004977015812726151, 'samples': 1611648, 'steps': 8393, 'loss/train': 1.9845424890518188} +11/06/2021 22:25:10 - INFO - __main__ - Step 8395: {'lr': 0.0004977008632783098, 'samples': 1611840, 'steps': 8394, 'loss/train': 1.7527318000793457} +11/06/2021 22:25:10 - INFO - __main__ - Step 8396: {'lr': 0.0004977001451723944, 'samples': 1612032, 'steps': 8395, 'loss/train': 0.8850865364074707} +11/06/2021 22:25:10 - INFO - __main__ - Step 8397: {'lr': 0.000497699426954869, 'samples': 1612224, 'steps': 8396, 'loss/train': 1.9200553894042969} +11/06/2021 22:25:11 - INFO - __main__ - Step 8398: {'lr': 0.0004976987086257342, 'samples': 1612416, 'steps': 8397, 'loss/train': 1.0962588787078857} +11/06/2021 22:25:12 - INFO - __main__ - Step 8399: {'lr': 0.0004976979901849901, 'samples': 1612608, 'steps': 8398, 'loss/train': 1.736077070236206} +11/06/2021 22:25:12 - INFO - __main__ - Step 8400: {'lr': 0.000497697271632637, 'samples': 1612800, 'steps': 8399, 'loss/train': 1.651288390159607} +11/06/2021 22:25:12 - INFO - __main__ - Step 8401: {'lr': 0.0004976965529686756, 'samples': 1612992, 'steps': 8400, 'loss/train': 1.851194977760315} +11/06/2021 22:25:13 - INFO - __main__ - Step 8402: {'lr': 0.0004976958341931057, 'samples': 1613184, 'steps': 8401, 'loss/train': 1.0811164379119873} +11/06/2021 22:25:14 - INFO - __main__ - Step 8403: {'lr': 0.000497695115305928, 'samples': 1613376, 'steps': 8402, 'loss/train': 1.9029980897903442} +11/06/2021 22:25:14 - INFO - __main__ - Step 8404: {'lr': 0.0004976943963071426, 'samples': 1613568, 'steps': 8403, 'loss/train': 1.7651731967926025} +11/06/2021 22:25:15 - INFO - __main__ - Step 8405: {'lr': 0.0004976936771967501, 'samples': 1613760, 'steps': 8404, 'loss/train': 2.381589412689209} +11/06/2021 22:25:15 - INFO - __main__ - Step 8406: {'lr': 0.0004976929579747505, 'samples': 1613952, 'steps': 8405, 'loss/train': 1.7756294012069702} +11/06/2021 22:25:15 - INFO - __main__ - Step 8407: {'lr': 0.0004976922386411444, 'samples': 1614144, 'steps': 8406, 'loss/train': 2.137291669845581} +11/06/2021 22:25:16 - INFO - __main__ - Step 8408: {'lr': 0.0004976915191959319, 'samples': 1614336, 'steps': 8407, 'loss/train': 1.879096508026123} +11/06/2021 22:25:17 - INFO - __main__ - Step 8409: {'lr': 0.0004976907996391135, 'samples': 1614528, 'steps': 8408, 'loss/train': 1.870473861694336} +11/06/2021 22:25:17 - INFO - __main__ - Step 8410: {'lr': 0.0004976900799706894, 'samples': 1614720, 'steps': 8409, 'loss/train': 2.050117015838623} +11/06/2021 22:25:17 - INFO - __main__ - Step 8411: {'lr': 0.00049768936019066, 'samples': 1614912, 'steps': 8410, 'loss/train': 1.824702262878418} +11/06/2021 22:25:18 - INFO - __main__ - Step 8412: {'lr': 0.0004976886402990255, 'samples': 1615104, 'steps': 8411, 'loss/train': 1.77139413356781} +11/06/2021 22:25:19 - INFO - __main__ - Step 8413: {'lr': 0.0004976879202957864, 'samples': 1615296, 'steps': 8412, 'loss/train': 1.8707973957061768} +11/06/2021 22:25:19 - INFO - __main__ - Step 8414: {'lr': 0.000497687200180943, 'samples': 1615488, 'steps': 8413, 'loss/train': 1.7304356098175049} +11/06/2021 22:25:19 - INFO - __main__ - Step 8415: {'lr': 0.0004976864799544954, 'samples': 1615680, 'steps': 8414, 'loss/train': 1.8535863161087036} +11/06/2021 22:25:20 - INFO - __main__ - Step 8416: {'lr': 0.0004976857596164443, 'samples': 1615872, 'steps': 8415, 'loss/train': 1.761738896369934} +11/06/2021 22:25:20 - INFO - __main__ - Step 8417: {'lr': 0.0004976850391667897, 'samples': 1616064, 'steps': 8416, 'loss/train': 1.0257487297058105} +11/06/2021 22:25:21 - INFO - __main__ - Step 8418: {'lr': 0.0004976843186055321, 'samples': 1616256, 'steps': 8417, 'loss/train': 1.9058445692062378} +11/06/2021 22:25:21 - INFO - __main__ - Step 8419: {'lr': 0.0004976835979326718, 'samples': 1616448, 'steps': 8418, 'loss/train': 1.5903434753417969} +11/06/2021 22:25:22 - INFO - __main__ - Step 8420: {'lr': 0.0004976828771482089, 'samples': 1616640, 'steps': 8419, 'loss/train': 1.9769971370697021} +11/06/2021 22:25:22 - INFO - __main__ - Step 8421: {'lr': 0.0004976821562521441, 'samples': 1616832, 'steps': 8420, 'loss/train': 1.9733790159225464} +11/06/2021 22:25:22 - INFO - __main__ - Step 8422: {'lr': 0.0004976814352444775, 'samples': 1617024, 'steps': 8421, 'loss/train': 1.1663745641708374} +11/06/2021 22:25:24 - INFO - __main__ - Step 8423: {'lr': 0.0004976807141252094, 'samples': 1617216, 'steps': 8422, 'loss/train': 1.938113808631897} +11/06/2021 22:25:24 - INFO - __main__ - Step 8424: {'lr': 0.0004976799928943403, 'samples': 1617408, 'steps': 8423, 'loss/train': 0.9520623683929443} +11/06/2021 22:25:25 - INFO - __main__ - Step 8425: {'lr': 0.0004976792715518703, 'samples': 1617600, 'steps': 8424, 'loss/train': 2.006859302520752} +11/06/2021 22:25:25 - INFO - __main__ - Step 8426: {'lr': 0.0004976785500978, 'samples': 1617792, 'steps': 8425, 'loss/train': 1.5716438293457031} +11/06/2021 22:25:25 - INFO - __main__ - Step 8427: {'lr': 0.0004976778285321294, 'samples': 1617984, 'steps': 8426, 'loss/train': 1.7659454345703125} +11/06/2021 22:25:26 - INFO - __main__ - Step 8428: {'lr': 0.0004976771068548591, 'samples': 1618176, 'steps': 8427, 'loss/train': 2.2531676292419434} +11/06/2021 22:25:27 - INFO - __main__ - Step 8429: {'lr': 0.0004976763850659893, 'samples': 1618368, 'steps': 8428, 'loss/train': 0.3412085175514221} +11/06/2021 22:25:27 - INFO - __main__ - Step 8430: {'lr': 0.0004976756631655203, 'samples': 1618560, 'steps': 8429, 'loss/train': 1.789984941482544} +11/06/2021 22:25:27 - INFO - __main__ - Step 8431: {'lr': 0.0004976749411534525, 'samples': 1618752, 'steps': 8430, 'loss/train': 1.566307783126831} +11/06/2021 22:25:28 - INFO - __main__ - Step 8432: {'lr': 0.0004976742190297862, 'samples': 1618944, 'steps': 8431, 'loss/train': 2.2874772548675537} +11/06/2021 22:25:28 - INFO - __main__ - Step 8433: {'lr': 0.0004976734967945217, 'samples': 1619136, 'steps': 8432, 'loss/train': 1.724574327468872} +11/06/2021 22:25:29 - INFO - __main__ - Step 8434: {'lr': 0.0004976727744476593, 'samples': 1619328, 'steps': 8433, 'loss/train': 2.225064516067505} +11/06/2021 22:25:29 - INFO - __main__ - Step 8435: {'lr': 0.0004976720519891994, 'samples': 1619520, 'steps': 8434, 'loss/train': 1.7268136739730835} +11/06/2021 22:25:30 - INFO - __main__ - Step 8436: {'lr': 0.0004976713294191423, 'samples': 1619712, 'steps': 8435, 'loss/train': 1.76718270778656} +11/06/2021 22:25:30 - INFO - __main__ - Step 8437: {'lr': 0.0004976706067374885, 'samples': 1619904, 'steps': 8436, 'loss/train': 1.7768479585647583} +11/06/2021 22:25:31 - INFO - __main__ - Step 8438: {'lr': 0.0004976698839442379, 'samples': 1620096, 'steps': 8437, 'loss/train': 1.0732344388961792} +11/06/2021 22:25:31 - INFO - __main__ - Step 8439: {'lr': 0.0004976691610393911, 'samples': 1620288, 'steps': 8438, 'loss/train': 2.1499216556549072} +11/06/2021 22:25:32 - INFO - __main__ - Step 8440: {'lr': 0.0004976684380229485, 'samples': 1620480, 'steps': 8439, 'loss/train': 1.8291432857513428} +11/06/2021 22:25:32 - INFO - __main__ - Step 8441: {'lr': 0.0004976677148949102, 'samples': 1620672, 'steps': 8440, 'loss/train': 1.7826381921768188} +11/06/2021 22:25:33 - INFO - __main__ - Step 8442: {'lr': 0.0004976669916552768, 'samples': 1620864, 'steps': 8441, 'loss/train': 1.9281136989593506} +11/06/2021 22:25:33 - INFO - __main__ - Step 8443: {'lr': 0.0004976662683040484, 'samples': 1621056, 'steps': 8442, 'loss/train': 1.7835140228271484} +11/06/2021 22:25:33 - INFO - __main__ - Step 8444: {'lr': 0.0004976655448412254, 'samples': 1621248, 'steps': 8443, 'loss/train': 2.6480824947357178} +11/06/2021 22:25:34 - INFO - __main__ - Step 8445: {'lr': 0.0004976648212668081, 'samples': 1621440, 'steps': 8444, 'loss/train': 1.505518913269043} +11/06/2021 22:25:35 - INFO - __main__ - Step 8446: {'lr': 0.0004976640975807969, 'samples': 1621632, 'steps': 8445, 'loss/train': 1.532829761505127} +11/06/2021 22:25:35 - INFO - __main__ - Step 8447: {'lr': 0.0004976633737831921, 'samples': 1621824, 'steps': 8446, 'loss/train': 1.6985620260238647} +11/06/2021 22:25:35 - INFO - __main__ - Step 8448: {'lr': 0.000497662649873994, 'samples': 1622016, 'steps': 8447, 'loss/train': 1.2889354228973389} +11/06/2021 22:25:36 - INFO - __main__ - Step 8449: {'lr': 0.0004976619258532029, 'samples': 1622208, 'steps': 8448, 'loss/train': 1.8851784467697144} +11/06/2021 22:25:37 - INFO - __main__ - Step 8450: {'lr': 0.0004976612017208191, 'samples': 1622400, 'steps': 8449, 'loss/train': 2.305765151977539} +11/06/2021 22:25:37 - INFO - __main__ - Step 8451: {'lr': 0.000497660477476843, 'samples': 1622592, 'steps': 8450, 'loss/train': 1.9551142454147339} +11/06/2021 22:25:37 - INFO - __main__ - Step 8452: {'lr': 0.000497659753121275, 'samples': 1622784, 'steps': 8451, 'loss/train': 2.0676944255828857} +11/06/2021 22:25:38 - INFO - __main__ - Step 8453: {'lr': 0.0004976590286541152, 'samples': 1622976, 'steps': 8452, 'loss/train': 1.929355502128601} +11/06/2021 22:25:38 - INFO - __main__ - Step 8454: {'lr': 0.0004976583040753643, 'samples': 1623168, 'steps': 8453, 'loss/train': 1.959873080253601} +11/06/2021 22:25:39 - INFO - __main__ - Step 8455: {'lr': 0.0004976575793850223, 'samples': 1623360, 'steps': 8454, 'loss/train': 1.7598445415496826} +11/06/2021 22:25:40 - INFO - __main__ - Step 8456: {'lr': 0.0004976568545830894, 'samples': 1623552, 'steps': 8455, 'loss/train': 1.6411019563674927} +11/06/2021 22:25:40 - INFO - __main__ - Step 8457: {'lr': 0.0004976561296695663, 'samples': 1623744, 'steps': 8456, 'loss/train': 1.8063533306121826} +11/06/2021 22:25:40 - INFO - __main__ - Step 8458: {'lr': 0.0004976554046444532, 'samples': 1623936, 'steps': 8457, 'loss/train': 1.4065788984298706} +11/06/2021 22:25:41 - INFO - __main__ - Step 8459: {'lr': 0.0004976546795077503, 'samples': 1624128, 'steps': 8458, 'loss/train': 2.1664505004882812} +11/06/2021 22:25:42 - INFO - __main__ - Step 8460: {'lr': 0.0004976539542594582, 'samples': 1624320, 'steps': 8459, 'loss/train': 1.423108458518982} +11/06/2021 22:25:42 - INFO - __main__ - Step 8461: {'lr': 0.0004976532288995768, 'samples': 1624512, 'steps': 8460, 'loss/train': 1.727888822555542} +11/06/2021 22:25:42 - INFO - __main__ - Step 8462: {'lr': 0.0004976525034281069, 'samples': 1624704, 'steps': 8461, 'loss/train': 1.7131630182266235} +11/06/2021 22:25:43 - INFO - __main__ - Step 8463: {'lr': 0.0004976517778450486, 'samples': 1624896, 'steps': 8462, 'loss/train': 1.9994878768920898} +11/06/2021 22:25:43 - INFO - __main__ - Step 8464: {'lr': 0.000497651052150402, 'samples': 1625088, 'steps': 8463, 'loss/train': 1.3184614181518555} +11/06/2021 22:25:44 - INFO - __main__ - Step 8465: {'lr': 0.0004976503263441679, 'samples': 1625280, 'steps': 8464, 'loss/train': 1.885838270187378} +11/06/2021 22:25:44 - INFO - __main__ - Step 8466: {'lr': 0.0004976496004263463, 'samples': 1625472, 'steps': 8465, 'loss/train': 1.80532968044281} +11/06/2021 22:25:45 - INFO - __main__ - Step 8467: {'lr': 0.0004976488743969376, 'samples': 1625664, 'steps': 8466, 'loss/train': 1.5060994625091553} +11/06/2021 22:25:45 - INFO - __main__ - Step 8468: {'lr': 0.0004976481482559421, 'samples': 1625856, 'steps': 8467, 'loss/train': 1.5242974758148193} +11/06/2021 22:25:46 - INFO - __main__ - Step 8469: {'lr': 0.0004976474220033602, 'samples': 1626048, 'steps': 8468, 'loss/train': 1.838634729385376} +11/06/2021 22:25:46 - INFO - __main__ - Step 8470: {'lr': 0.0004976466956391922, 'samples': 1626240, 'steps': 8469, 'loss/train': 1.2237740755081177} +11/06/2021 22:25:47 - INFO - __main__ - Step 8471: {'lr': 0.0004976459691634384, 'samples': 1626432, 'steps': 8470, 'loss/train': 1.4460675716400146} +11/06/2021 22:25:47 - INFO - __main__ - Step 8472: {'lr': 0.0004976452425760992, 'samples': 1626624, 'steps': 8471, 'loss/train': 2.1150126457214355} +11/06/2021 22:25:48 - INFO - __main__ - Step 8473: {'lr': 0.0004976445158771748, 'samples': 1626816, 'steps': 8472, 'loss/train': 1.7219116687774658} +11/06/2021 22:25:48 - INFO - __main__ - Step 8474: {'lr': 0.0004976437890666657, 'samples': 1627008, 'steps': 8473, 'loss/train': 1.7514417171478271} +11/06/2021 22:25:48 - INFO - __main__ - Step 8475: {'lr': 0.0004976430621445721, 'samples': 1627200, 'steps': 8474, 'loss/train': 1.6506552696228027} +11/06/2021 22:25:50 - INFO - __main__ - Step 8476: {'lr': 0.0004976423351108943, 'samples': 1627392, 'steps': 8475, 'loss/train': 1.3242745399475098} +11/06/2021 22:25:50 - INFO - __main__ - Step 8477: {'lr': 0.0004976416079656328, 'samples': 1627584, 'steps': 8476, 'loss/train': 2.3073718547821045} +11/06/2021 22:25:50 - INFO - __main__ - Step 8478: {'lr': 0.0004976408807087876, 'samples': 1627776, 'steps': 8477, 'loss/train': 1.0934592485427856} +11/06/2021 22:25:51 - INFO - __main__ - Step 8479: {'lr': 0.0004976401533403594, 'samples': 1627968, 'steps': 8478, 'loss/train': 1.5833334922790527} +11/06/2021 22:25:51 - INFO - __main__ - Step 8480: {'lr': 0.0004976394258603484, 'samples': 1628160, 'steps': 8479, 'loss/train': 1.3912901878356934} +11/06/2021 22:25:52 - INFO - __main__ - Step 8481: {'lr': 0.0004976386982687549, 'samples': 1628352, 'steps': 8480, 'loss/train': 1.8894435167312622} +11/06/2021 22:25:52 - INFO - __main__ - Step 8482: {'lr': 0.0004976379705655791, 'samples': 1628544, 'steps': 8481, 'loss/train': 1.7393689155578613} +11/06/2021 22:25:53 - INFO - __main__ - Step 8483: {'lr': 0.0004976372427508215, 'samples': 1628736, 'steps': 8482, 'loss/train': 1.9663249254226685} +11/06/2021 22:25:53 - INFO - __main__ - Step 8484: {'lr': 0.0004976365148244824, 'samples': 1628928, 'steps': 8483, 'loss/train': 2.2855916023254395} +11/06/2021 22:25:53 - INFO - __main__ - Step 8485: {'lr': 0.0004976357867865621, 'samples': 1629120, 'steps': 8484, 'loss/train': 1.8762072324752808} +11/06/2021 22:25:54 - INFO - __main__ - Step 8486: {'lr': 0.0004976350586370609, 'samples': 1629312, 'steps': 8485, 'loss/train': 1.8550057411193848} +11/06/2021 22:25:55 - INFO - __main__ - Step 8487: {'lr': 0.0004976343303759792, 'samples': 1629504, 'steps': 8486, 'loss/train': 1.618645191192627} +11/06/2021 22:25:55 - INFO - __main__ - Step 8488: {'lr': 0.0004976336020033174, 'samples': 1629696, 'steps': 8487, 'loss/train': 1.672871470451355} +11/06/2021 22:25:55 - INFO - __main__ - Step 8489: {'lr': 0.0004976328735190755, 'samples': 1629888, 'steps': 8488, 'loss/train': 1.8050670623779297} +11/06/2021 22:25:56 - INFO - __main__ - Step 8490: {'lr': 0.0004976321449232542, 'samples': 1630080, 'steps': 8489, 'loss/train': 1.4703295230865479} +11/06/2021 22:25:56 - INFO - __main__ - Step 8491: {'lr': 0.0004976314162158536, 'samples': 1630272, 'steps': 8490, 'loss/train': 1.5319691896438599} +11/06/2021 22:25:57 - INFO - __main__ - Step 8492: {'lr': 0.0004976306873968741, 'samples': 1630464, 'steps': 8491, 'loss/train': 1.876915454864502} +11/06/2021 22:25:57 - INFO - __main__ - Step 8493: {'lr': 0.0004976299584663161, 'samples': 1630656, 'steps': 8492, 'loss/train': 1.787011981010437} +11/06/2021 22:25:58 - INFO - __main__ - Step 8494: {'lr': 0.0004976292294241798, 'samples': 1630848, 'steps': 8493, 'loss/train': 1.3954660892486572} +11/06/2021 22:25:58 - INFO - __main__ - Step 8495: {'lr': 0.0004976285002704656, 'samples': 1631040, 'steps': 8494, 'loss/train': 2.078723669052124} +11/06/2021 22:25:59 - INFO - __main__ - Step 8496: {'lr': 0.0004976277710051739, 'samples': 1631232, 'steps': 8495, 'loss/train': 2.3327043056488037} +11/06/2021 22:26:00 - INFO - __main__ - Step 8497: {'lr': 0.0004976270416283049, 'samples': 1631424, 'steps': 8496, 'loss/train': 1.9234745502471924} +11/06/2021 22:26:00 - INFO - __main__ - Step 8498: {'lr': 0.000497626312139859, 'samples': 1631616, 'steps': 8497, 'loss/train': 1.7845796346664429} +11/06/2021 22:26:00 - INFO - __main__ - Step 8499: {'lr': 0.0004976255825398365, 'samples': 1631808, 'steps': 8498, 'loss/train': 2.1495463848114014} +11/06/2021 22:26:01 - INFO - __main__ - Step 8500: {'lr': 0.0004976248528282376, 'samples': 1632000, 'steps': 8499, 'loss/train': 2.1509108543395996} +11/06/2021 22:26:01 - INFO - __main__ - Step 8501: {'lr': 0.000497624123005063, 'samples': 1632192, 'steps': 8500, 'loss/train': 1.78944993019104} +11/06/2021 22:26:02 - INFO - __main__ - Step 8502: {'lr': 0.0004976233930703126, 'samples': 1632384, 'steps': 8501, 'loss/train': 1.7581290006637573} +11/06/2021 22:26:02 - INFO - __main__ - Step 8503: {'lr': 0.000497622663023987, 'samples': 1632576, 'steps': 8502, 'loss/train': 1.6255358457565308} +11/06/2021 22:26:03 - INFO - __main__ - Step 8504: {'lr': 0.0004976219328660864, 'samples': 1632768, 'steps': 8503, 'loss/train': 1.977895975112915} +11/06/2021 22:26:03 - INFO - __main__ - Step 8505: {'lr': 0.0004976212025966112, 'samples': 1632960, 'steps': 8504, 'loss/train': 3.297560453414917} +11/06/2021 22:26:03 - INFO - __main__ - Step 8506: {'lr': 0.0004976204722155617, 'samples': 1633152, 'steps': 8505, 'loss/train': 1.7833354473114014} +11/06/2021 22:26:05 - INFO - __main__ - Step 8507: {'lr': 0.0004976197417229383, 'samples': 1633344, 'steps': 8506, 'loss/train': 1.4364817142486572} +11/06/2021 22:26:05 - INFO - __main__ - Step 8508: {'lr': 0.0004976190111187412, 'samples': 1633536, 'steps': 8507, 'loss/train': 2.1614036560058594} +11/06/2021 22:26:05 - INFO - __main__ - Step 8509: {'lr': 0.0004976182804029708, 'samples': 1633728, 'steps': 8508, 'loss/train': 1.8485922813415527} +11/06/2021 22:26:06 - INFO - __main__ - Step 8510: {'lr': 0.0004976175495756274, 'samples': 1633920, 'steps': 8509, 'loss/train': 1.9994100332260132} +11/06/2021 22:26:06 - INFO - __main__ - Step 8511: {'lr': 0.0004976168186367115, 'samples': 1634112, 'steps': 8510, 'loss/train': 1.4582551717758179} +11/06/2021 22:26:07 - INFO - __main__ - Step 8512: {'lr': 0.0004976160875862231, 'samples': 1634304, 'steps': 8511, 'loss/train': 1.6600501537322998} +11/06/2021 22:26:07 - INFO - __main__ - Step 8513: {'lr': 0.0004976153564241628, 'samples': 1634496, 'steps': 8512, 'loss/train': 1.6046333312988281} +11/06/2021 22:26:08 - INFO - __main__ - Step 8514: {'lr': 0.0004976146251505309, 'samples': 1634688, 'steps': 8513, 'loss/train': 2.3201334476470947} +11/06/2021 22:26:08 - INFO - __main__ - Step 8515: {'lr': 0.0004976138937653275, 'samples': 1634880, 'steps': 8514, 'loss/train': 1.6256712675094604} +11/06/2021 22:26:08 - INFO - __main__ - Step 8516: {'lr': 0.0004976131622685532, 'samples': 1635072, 'steps': 8515, 'loss/train': 1.8171868324279785} +11/06/2021 22:26:09 - INFO - __main__ - Step 8517: {'lr': 0.0004976124306602083, 'samples': 1635264, 'steps': 8516, 'loss/train': 1.7854278087615967} +11/06/2021 22:26:10 - INFO - __main__ - Step 8518: {'lr': 0.0004976116989402929, 'samples': 1635456, 'steps': 8517, 'loss/train': 1.7013543844223022} +11/06/2021 22:26:10 - INFO - __main__ - Step 8519: {'lr': 0.0004976109671088076, 'samples': 1635648, 'steps': 8518, 'loss/train': 1.9890172481536865} +11/06/2021 22:26:10 - INFO - __main__ - Step 8520: {'lr': 0.0004976102351657526, 'samples': 1635840, 'steps': 8519, 'loss/train': 1.8006373643875122} +11/06/2021 22:26:11 - INFO - __main__ - Step 8521: {'lr': 0.0004976095031111283, 'samples': 1636032, 'steps': 8520, 'loss/train': 1.9364084005355835} +11/06/2021 22:26:11 - INFO - __main__ - Step 8522: {'lr': 0.0004976087709449348, 'samples': 1636224, 'steps': 8521, 'loss/train': 1.6207133531570435} +11/06/2021 22:26:12 - INFO - __main__ - Step 8523: {'lr': 0.0004976080386671728, 'samples': 1636416, 'steps': 8522, 'loss/train': 2.250715732574463} +11/06/2021 22:26:13 - INFO - __main__ - Step 8524: {'lr': 0.0004976073062778423, 'samples': 1636608, 'steps': 8523, 'loss/train': 1.8443859815597534} +11/06/2021 22:26:13 - INFO - __main__ - Step 8525: {'lr': 0.0004976065737769439, 'samples': 1636800, 'steps': 8524, 'loss/train': 0.9607848525047302} +11/06/2021 22:26:13 - INFO - __main__ - Step 8526: {'lr': 0.0004976058411644777, 'samples': 1636992, 'steps': 8525, 'loss/train': 1.7340941429138184} +11/06/2021 22:26:14 - INFO - __main__ - Step 8527: {'lr': 0.0004976051084404443, 'samples': 1637184, 'steps': 8526, 'loss/train': 2.0823657512664795} +11/06/2021 22:26:15 - INFO - __main__ - Step 8528: {'lr': 0.0004976043756048436, 'samples': 1637376, 'steps': 8527, 'loss/train': 1.8343414068222046} +11/06/2021 22:26:15 - INFO - __main__ - Step 8529: {'lr': 0.0004976036426576763, 'samples': 1637568, 'steps': 8528, 'loss/train': 2.1914784908294678} +11/06/2021 22:26:15 - INFO - __main__ - Step 8530: {'lr': 0.0004976029095989427, 'samples': 1637760, 'steps': 8529, 'loss/train': 3.2090442180633545} +11/06/2021 22:26:16 - INFO - __main__ - Step 8531: {'lr': 0.000497602176428643, 'samples': 1637952, 'steps': 8530, 'loss/train': 2.355168342590332} +11/06/2021 22:26:16 - INFO - __main__ - Step 8532: {'lr': 0.0004976014431467775, 'samples': 1638144, 'steps': 8531, 'loss/train': 1.1861897706985474} +11/06/2021 22:26:17 - INFO - __main__ - Step 8533: {'lr': 0.0004976007097533467, 'samples': 1638336, 'steps': 8532, 'loss/train': 2.105987071990967} +11/06/2021 22:26:17 - INFO - __main__ - Step 8534: {'lr': 0.0004975999762483509, 'samples': 1638528, 'steps': 8533, 'loss/train': 1.797425389289856} +11/06/2021 22:26:18 - INFO - __main__ - Step 8535: {'lr': 0.0004975992426317902, 'samples': 1638720, 'steps': 8534, 'loss/train': 1.2677090167999268} +11/06/2021 22:26:18 - INFO - __main__ - Step 8536: {'lr': 0.0004975985089036652, 'samples': 1638912, 'steps': 8535, 'loss/train': 1.7440499067306519} +11/06/2021 22:26:18 - INFO - __main__ - Step 8537: {'lr': 0.0004975977750639761, 'samples': 1639104, 'steps': 8536, 'loss/train': 3.189857244491577} +11/06/2021 22:26:19 - INFO - __main__ - Step 8538: {'lr': 0.0004975970411127233, 'samples': 1639296, 'steps': 8537, 'loss/train': 1.8964868783950806} +11/06/2021 22:26:20 - INFO - __main__ - Step 8539: {'lr': 0.0004975963070499071, 'samples': 1639488, 'steps': 8538, 'loss/train': 2.1125876903533936} +11/06/2021 22:26:20 - INFO - __main__ - Step 8540: {'lr': 0.0004975955728755277, 'samples': 1639680, 'steps': 8539, 'loss/train': 1.6929922103881836} +11/06/2021 22:26:21 - INFO - __main__ - Step 8541: {'lr': 0.0004975948385895858, 'samples': 1639872, 'steps': 8540, 'loss/train': 1.6374714374542236} +11/06/2021 22:26:21 - INFO - __main__ - Step 8542: {'lr': 0.0004975941041920813, 'samples': 1640064, 'steps': 8541, 'loss/train': 2.006967067718506} +11/06/2021 22:26:22 - INFO - __main__ - Step 8543: {'lr': 0.0004975933696830147, 'samples': 1640256, 'steps': 8542, 'loss/train': 1.9213240146636963} +11/06/2021 22:26:22 - INFO - __main__ - Step 8544: {'lr': 0.0004975926350623864, 'samples': 1640448, 'steps': 8543, 'loss/train': 2.296802043914795} +11/06/2021 22:26:23 - INFO - __main__ - Step 8545: {'lr': 0.0004975919003301967, 'samples': 1640640, 'steps': 8544, 'loss/train': 1.7071173191070557} +11/06/2021 22:26:23 - INFO - __main__ - Step 8546: {'lr': 0.0004975911654864459, 'samples': 1640832, 'steps': 8545, 'loss/train': 2.5078957080841064} +11/06/2021 22:26:23 - INFO - __main__ - Step 8547: {'lr': 0.0004975904305311344, 'samples': 1641024, 'steps': 8546, 'loss/train': 2.413429021835327} +11/06/2021 22:26:25 - INFO - __main__ - Step 8548: {'lr': 0.0004975896954642623, 'samples': 1641216, 'steps': 8547, 'loss/train': 1.545986294746399} +11/06/2021 22:26:25 - INFO - __main__ - Step 8549: {'lr': 0.0004975889602858303, 'samples': 1641408, 'steps': 8548, 'loss/train': 1.858424425125122} +11/06/2021 22:26:26 - INFO - __main__ - Step 8550: {'lr': 0.0004975882249958385, 'samples': 1641600, 'steps': 8549, 'loss/train': 2.576998472213745} +11/06/2021 22:26:26 - INFO - __main__ - Step 8551: {'lr': 0.0004975874895942872, 'samples': 1641792, 'steps': 8550, 'loss/train': 1.2816332578659058} +11/06/2021 22:26:26 - INFO - __main__ - Step 8552: {'lr': 0.0004975867540811768, 'samples': 1641984, 'steps': 8551, 'loss/train': 1.6916189193725586} +11/06/2021 22:26:27 - INFO - __main__ - Step 8553: {'lr': 0.0004975860184565076, 'samples': 1642176, 'steps': 8552, 'loss/train': 1.8677070140838623} +11/06/2021 22:26:27 - INFO - __main__ - Step 8554: {'lr': 0.0004975852827202801, 'samples': 1642368, 'steps': 8553, 'loss/train': 1.7044568061828613} +11/06/2021 22:26:28 - INFO - __main__ - Step 8555: {'lr': 0.0004975845468724944, 'samples': 1642560, 'steps': 8554, 'loss/train': 1.236737847328186} +11/06/2021 22:26:29 - INFO - __main__ - Step 8556: {'lr': 0.0004975838109131509, 'samples': 1642752, 'steps': 8555, 'loss/train': 1.6801140308380127} +11/06/2021 22:26:29 - INFO - __main__ - Step 8557: {'lr': 0.0004975830748422499, 'samples': 1642944, 'steps': 8556, 'loss/train': 1.9419505596160889} +11/06/2021 22:26:29 - INFO - __main__ - Step 8558: {'lr': 0.0004975823386597918, 'samples': 1643136, 'steps': 8557, 'loss/train': 1.7988413572311401} +11/06/2021 22:26:30 - INFO - __main__ - Step 8559: {'lr': 0.000497581602365777, 'samples': 1643328, 'steps': 8558, 'loss/train': 2.347743511199951} +11/06/2021 22:26:30 - INFO - __main__ - Step 8560: {'lr': 0.0004975808659602058, 'samples': 1643520, 'steps': 8559, 'loss/train': 1.103050947189331} +11/06/2021 22:26:31 - INFO - __main__ - Step 8561: {'lr': 0.0004975801294430784, 'samples': 1643712, 'steps': 8560, 'loss/train': 2.005465030670166} +11/06/2021 22:26:31 - INFO - __main__ - Step 8562: {'lr': 0.0004975793928143952, 'samples': 1643904, 'steps': 8561, 'loss/train': 1.6958545446395874} +11/06/2021 22:26:32 - INFO - __main__ - Step 8563: {'lr': 0.0004975786560741566, 'samples': 1644096, 'steps': 8562, 'loss/train': 1.6469171047210693} +11/06/2021 22:26:32 - INFO - __main__ - Step 8564: {'lr': 0.0004975779192223629, 'samples': 1644288, 'steps': 8563, 'loss/train': 1.7488797903060913} +11/06/2021 22:26:32 - INFO - __main__ - Step 8565: {'lr': 0.0004975771822590143, 'samples': 1644480, 'steps': 8564, 'loss/train': 1.531661868095398} +11/06/2021 22:26:33 - INFO - __main__ - Step 8566: {'lr': 0.0004975764451841114, 'samples': 1644672, 'steps': 8565, 'loss/train': 1.9583240747451782} +11/06/2021 22:26:34 - INFO - __main__ - Step 8567: {'lr': 0.0004975757079976542, 'samples': 1644864, 'steps': 8566, 'loss/train': 2.6760129928588867} +11/06/2021 22:26:34 - INFO - __main__ - Step 8568: {'lr': 0.0004975749706996433, 'samples': 1645056, 'steps': 8567, 'loss/train': 1.9086993932724} +11/06/2021 22:26:34 - INFO - __main__ - Step 8569: {'lr': 0.0004975742332900789, 'samples': 1645248, 'steps': 8568, 'loss/train': 1.3222005367279053} +11/06/2021 22:26:35 - INFO - __main__ - Step 8570: {'lr': 0.0004975734957689614, 'samples': 1645440, 'steps': 8569, 'loss/train': 2.3594229221343994} +11/06/2021 22:26:36 - INFO - __main__ - Step 8571: {'lr': 0.0004975727581362911, 'samples': 1645632, 'steps': 8570, 'loss/train': 1.3136167526245117} +11/06/2021 22:26:36 - INFO - __main__ - Step 8572: {'lr': 0.0004975720203920683, 'samples': 1645824, 'steps': 8571, 'loss/train': 2.3485770225524902} +11/06/2021 22:26:36 - INFO - __main__ - Step 8573: {'lr': 0.0004975712825362934, 'samples': 1646016, 'steps': 8572, 'loss/train': 2.9186878204345703} +11/06/2021 22:26:37 - INFO - __main__ - Step 8574: {'lr': 0.0004975705445689668, 'samples': 1646208, 'steps': 8573, 'loss/train': 1.8523027896881104} +11/06/2021 22:26:37 - INFO - __main__ - Step 8575: {'lr': 0.0004975698064900886, 'samples': 1646400, 'steps': 8574, 'loss/train': 2.420170783996582} +11/06/2021 22:26:38 - INFO - __main__ - Step 8576: {'lr': 0.0004975690682996592, 'samples': 1646592, 'steps': 8575, 'loss/train': 1.9467846155166626} +11/06/2021 22:26:38 - INFO - __main__ - Step 8577: {'lr': 0.0004975683299976791, 'samples': 1646784, 'steps': 8576, 'loss/train': 1.946389079093933} +11/06/2021 22:26:39 - INFO - __main__ - Step 8578: {'lr': 0.0004975675915841485, 'samples': 1646976, 'steps': 8577, 'loss/train': 2.061795711517334} +11/06/2021 22:26:39 - INFO - __main__ - Step 8579: {'lr': 0.0004975668530590679, 'samples': 1647168, 'steps': 8578, 'loss/train': 2.067392110824585} +11/06/2021 22:26:40 - INFO - __main__ - Step 8580: {'lr': 0.0004975661144224374, 'samples': 1647360, 'steps': 8579, 'loss/train': 2.0112924575805664} +11/06/2021 22:26:41 - INFO - __main__ - Step 8581: {'lr': 0.0004975653756742574, 'samples': 1647552, 'steps': 8580, 'loss/train': 1.770460605621338} +11/06/2021 22:26:42 - INFO - __main__ - Step 8582: {'lr': 0.0004975646368145282, 'samples': 1647744, 'steps': 8581, 'loss/train': 2.0862138271331787} +11/06/2021 22:26:42 - INFO - __main__ - Step 8583: {'lr': 0.0004975638978432503, 'samples': 1647936, 'steps': 8582, 'loss/train': 1.6407994031906128} +11/06/2021 22:26:42 - INFO - __main__ - Step 8584: {'lr': 0.0004975631587604239, 'samples': 1648128, 'steps': 8583, 'loss/train': 1.8305928707122803} +11/06/2021 22:26:43 - INFO - __main__ - Step 8585: {'lr': 0.0004975624195660494, 'samples': 1648320, 'steps': 8584, 'loss/train': 1.8244094848632812} +11/06/2021 22:26:43 - INFO - __main__ - Step 8586: {'lr': 0.0004975616802601271, 'samples': 1648512, 'steps': 8585, 'loss/train': 1.8164951801300049} +11/06/2021 22:26:44 - INFO - __main__ - Step 8587: {'lr': 0.0004975609408426572, 'samples': 1648704, 'steps': 8586, 'loss/train': 1.84238600730896} +11/06/2021 22:26:45 - INFO - __main__ - Step 8588: {'lr': 0.0004975602013136403, 'samples': 1648896, 'steps': 8587, 'loss/train': 1.9760645627975464} +11/06/2021 22:26:45 - INFO - __main__ - Step 8589: {'lr': 0.0004975594616730766, 'samples': 1649088, 'steps': 8588, 'loss/train': 1.6991413831710815} +11/06/2021 22:26:45 - INFO - __main__ - Step 8590: {'lr': 0.0004975587219209663, 'samples': 1649280, 'steps': 8589, 'loss/train': 1.3211325407028198} +11/06/2021 22:26:46 - INFO - __main__ - Step 8591: {'lr': 0.0004975579820573099, 'samples': 1649472, 'steps': 8590, 'loss/train': 1.5335558652877808} +11/06/2021 22:26:46 - INFO - __main__ - Step 8592: {'lr': 0.0004975572420821078, 'samples': 1649664, 'steps': 8591, 'loss/train': 1.8905811309814453} +11/06/2021 22:26:47 - INFO - __main__ - Step 8593: {'lr': 0.0004975565019953601, 'samples': 1649856, 'steps': 8592, 'loss/train': 1.5297328233718872} +11/06/2021 22:26:47 - INFO - __main__ - Step 8594: {'lr': 0.0004975557617970673, 'samples': 1650048, 'steps': 8593, 'loss/train': 1.714114785194397} +11/06/2021 22:26:48 - INFO - __main__ - Step 8595: {'lr': 0.0004975550214872296, 'samples': 1650240, 'steps': 8594, 'loss/train': 1.8319971561431885} +11/06/2021 22:26:48 - INFO - __main__ - Step 8596: {'lr': 0.0004975542810658476, 'samples': 1650432, 'steps': 8595, 'loss/train': 1.850310206413269} +11/06/2021 22:26:48 - INFO - __main__ - Step 8597: {'lr': 0.0004975535405329213, 'samples': 1650624, 'steps': 8596, 'loss/train': 1.9651538133621216} +11/06/2021 22:26:49 - INFO - __main__ - Step 8598: {'lr': 0.0004975527998884513, 'samples': 1650816, 'steps': 8597, 'loss/train': 1.1798516511917114} +11/06/2021 22:26:50 - INFO - __main__ - Step 8599: {'lr': 0.0004975520591324378, 'samples': 1651008, 'steps': 8598, 'loss/train': 1.6260879039764404} +11/06/2021 22:26:51 - INFO - __main__ - Step 8600: {'lr': 0.0004975513182648812, 'samples': 1651200, 'steps': 8599, 'loss/train': 1.9237269163131714} +11/06/2021 22:26:51 - INFO - __main__ - Step 8601: {'lr': 0.0004975505772857818, 'samples': 1651392, 'steps': 8600, 'loss/train': 1.373760461807251} +11/06/2021 22:26:51 - INFO - __main__ - Step 8602: {'lr': 0.0004975498361951398, 'samples': 1651584, 'steps': 8601, 'loss/train': 1.5592304468154907} +11/06/2021 22:26:52 - INFO - __main__ - Step 8603: {'lr': 0.0004975490949929558, 'samples': 1651776, 'steps': 8602, 'loss/train': 1.782822608947754} +11/06/2021 22:26:53 - INFO - __main__ - Step 8604: {'lr': 0.00049754835367923, 'samples': 1651968, 'steps': 8603, 'loss/train': 1.2513318061828613} +11/06/2021 22:26:53 - INFO - __main__ - Step 8605: {'lr': 0.0004975476122539627, 'samples': 1652160, 'steps': 8604, 'loss/train': 1.4960685968399048} +11/06/2021 22:26:53 - INFO - __main__ - Step 8606: {'lr': 0.0004975468707171542, 'samples': 1652352, 'steps': 8605, 'loss/train': 1.4390000104904175} +11/06/2021 22:26:54 - INFO - __main__ - Step 8607: {'lr': 0.000497546129068805, 'samples': 1652544, 'steps': 8606, 'loss/train': 1.4670497179031372} +11/06/2021 22:26:54 - INFO - __main__ - Step 8608: {'lr': 0.0004975453873089153, 'samples': 1652736, 'steps': 8607, 'loss/train': 2.2388570308685303} +11/06/2021 22:26:55 - INFO - __main__ - Step 8609: {'lr': 0.0004975446454374854, 'samples': 1652928, 'steps': 8608, 'loss/train': 1.8201464414596558} +11/06/2021 22:26:55 - INFO - __main__ - Step 8610: {'lr': 0.0004975439034545158, 'samples': 1653120, 'steps': 8609, 'loss/train': 1.0466943979263306} +11/06/2021 22:26:56 - INFO - __main__ - Step 8611: {'lr': 0.0004975431613600067, 'samples': 1653312, 'steps': 8610, 'loss/train': 1.8127079010009766} +11/06/2021 22:26:56 - INFO - __main__ - Step 8612: {'lr': 0.0004975424191539585, 'samples': 1653504, 'steps': 8611, 'loss/train': 1.8894764184951782} +11/06/2021 22:26:57 - INFO - __main__ - Step 8613: {'lr': 0.0004975416768363715, 'samples': 1653696, 'steps': 8612, 'loss/train': 1.5986841917037964} +11/06/2021 22:26:57 - INFO - __main__ - Step 8614: {'lr': 0.0004975409344072459, 'samples': 1653888, 'steps': 8613, 'loss/train': 1.9542250633239746} +11/06/2021 22:26:58 - INFO - __main__ - Step 8615: {'lr': 0.0004975401918665823, 'samples': 1654080, 'steps': 8614, 'loss/train': 1.8345215320587158} +11/06/2021 22:26:58 - INFO - __main__ - Step 8616: {'lr': 0.0004975394492143808, 'samples': 1654272, 'steps': 8615, 'loss/train': 2.525263547897339} +11/06/2021 22:26:59 - INFO - __main__ - Step 8617: {'lr': 0.0004975387064506421, 'samples': 1654464, 'steps': 8616, 'loss/train': 1.956400752067566} +11/06/2021 22:26:59 - INFO - __main__ - Step 8618: {'lr': 0.000497537963575366, 'samples': 1654656, 'steps': 8617, 'loss/train': 1.734102725982666} +11/06/2021 22:26:59 - INFO - __main__ - Step 8619: {'lr': 0.0004975372205885533, 'samples': 1654848, 'steps': 8618, 'loss/train': 1.9009313583374023} +11/06/2021 22:27:00 - INFO - __main__ - Step 8620: {'lr': 0.0004975364774902041, 'samples': 1655040, 'steps': 8619, 'loss/train': 2.392646551132202} +11/06/2021 22:27:01 - INFO - __main__ - Step 8621: {'lr': 0.0004975357342803187, 'samples': 1655232, 'steps': 8620, 'loss/train': 1.483763575553894} +11/06/2021 22:27:01 - INFO - __main__ - Step 8622: {'lr': 0.0004975349909588976, 'samples': 1655424, 'steps': 8621, 'loss/train': 1.836098313331604} +11/06/2021 22:27:02 - INFO - __main__ - Step 8623: {'lr': 0.000497534247525941, 'samples': 1655616, 'steps': 8622, 'loss/train': 1.932421326637268} +11/06/2021 22:27:02 - INFO - __main__ - Step 8624: {'lr': 0.0004975335039814493, 'samples': 1655808, 'steps': 8623, 'loss/train': 1.0708638429641724} +11/06/2021 22:27:03 - INFO - __main__ - Step 8625: {'lr': 0.0004975327603254229, 'samples': 1656000, 'steps': 8624, 'loss/train': 1.1579554080963135} +11/06/2021 22:27:03 - INFO - __main__ - Step 8626: {'lr': 0.000497532016557862, 'samples': 1656192, 'steps': 8625, 'loss/train': 1.4248061180114746} +11/06/2021 22:27:04 - INFO - __main__ - Step 8627: {'lr': 0.0004975312726787671, 'samples': 1656384, 'steps': 8626, 'loss/train': 2.444399833679199} +11/06/2021 22:27:04 - INFO - __main__ - Step 8628: {'lr': 0.0004975305286881383, 'samples': 1656576, 'steps': 8627, 'loss/train': 1.7895426750183105} +11/06/2021 22:27:04 - INFO - __main__ - Step 8629: {'lr': 0.0004975297845859761, 'samples': 1656768, 'steps': 8628, 'loss/train': 1.8516370058059692} +11/06/2021 22:27:05 - INFO - __main__ - Step 8630: {'lr': 0.0004975290403722807, 'samples': 1656960, 'steps': 8629, 'loss/train': 1.1760151386260986} +11/06/2021 22:27:06 - INFO - __main__ - Step 8631: {'lr': 0.0004975282960470527, 'samples': 1657152, 'steps': 8630, 'loss/train': 0.9543409943580627} +11/06/2021 22:27:06 - INFO - __main__ - Step 8632: {'lr': 0.0004975275516102922, 'samples': 1657344, 'steps': 8631, 'loss/train': 1.7859746217727661} +11/06/2021 22:27:06 - INFO - __main__ - Step 8633: {'lr': 0.0004975268070619996, 'samples': 1657536, 'steps': 8632, 'loss/train': 1.8400938510894775} +11/06/2021 22:27:07 - INFO - __main__ - Step 8634: {'lr': 0.0004975260624021752, 'samples': 1657728, 'steps': 8633, 'loss/train': 1.3847429752349854} +11/06/2021 22:27:07 - INFO - __main__ - Step 8635: {'lr': 0.0004975253176308194, 'samples': 1657920, 'steps': 8634, 'loss/train': 1.8140875101089478} +11/06/2021 22:27:08 - INFO - __main__ - Step 8636: {'lr': 0.0004975245727479325, 'samples': 1658112, 'steps': 8635, 'loss/train': 1.8529094457626343} +11/06/2021 22:27:09 - INFO - __main__ - Step 8637: {'lr': 0.0004975238277535149, 'samples': 1658304, 'steps': 8636, 'loss/train': 1.9702752828598022} +11/06/2021 22:27:09 - INFO - __main__ - Step 8638: {'lr': 0.0004975230826475669, 'samples': 1658496, 'steps': 8637, 'loss/train': 1.9060972929000854} +11/06/2021 22:27:09 - INFO - __main__ - Step 8639: {'lr': 0.0004975223374300887, 'samples': 1658688, 'steps': 8638, 'loss/train': 2.0410006046295166} +11/06/2021 22:27:10 - INFO - __main__ - Step 8640: {'lr': 0.0004975215921010808, 'samples': 1658880, 'steps': 8639, 'loss/train': 1.9541411399841309} +11/06/2021 22:27:11 - INFO - __main__ - Step 8641: {'lr': 0.0004975208466605435, 'samples': 1659072, 'steps': 8640, 'loss/train': 1.7635051012039185} +11/06/2021 22:27:12 - INFO - __main__ - Step 8642: {'lr': 0.0004975201011084773, 'samples': 1659264, 'steps': 8641, 'loss/train': 1.650898814201355} +11/06/2021 22:27:12 - INFO - __main__ - Step 8643: {'lr': 0.0004975193554448821, 'samples': 1659456, 'steps': 8642, 'loss/train': 1.8950550556182861} +11/06/2021 22:27:12 - INFO - __main__ - Step 8644: {'lr': 0.0004975186096697585, 'samples': 1659648, 'steps': 8643, 'loss/train': 2.5472521781921387} +11/06/2021 22:27:13 - INFO - __main__ - Step 8645: {'lr': 0.000497517863783107, 'samples': 1659840, 'steps': 8644, 'loss/train': 1.438095211982727} +11/06/2021 22:27:13 - INFO - __main__ - Step 8646: {'lr': 0.0004975171177849277, 'samples': 1660032, 'steps': 8645, 'loss/train': 2.031336545944214} +11/06/2021 22:27:14 - INFO - __main__ - Step 8647: {'lr': 0.000497516371675221, 'samples': 1660224, 'steps': 8646, 'loss/train': 2.2316641807556152} +11/06/2021 22:27:15 - INFO - __main__ - Step 8648: {'lr': 0.0004975156254539873, 'samples': 1660416, 'steps': 8647, 'loss/train': 2.0939579010009766} +11/06/2021 22:27:15 - INFO - __main__ - Step 8649: {'lr': 0.0004975148791212269, 'samples': 1660608, 'steps': 8648, 'loss/train': 1.8442882299423218} +11/06/2021 22:27:15 - INFO - __main__ - Step 8650: {'lr': 0.00049751413267694, 'samples': 1660800, 'steps': 8649, 'loss/train': 2.065793752670288} +11/06/2021 22:27:16 - INFO - __main__ - Step 8651: {'lr': 0.000497513386121127, 'samples': 1660992, 'steps': 8650, 'loss/train': 1.510509729385376} +11/06/2021 22:27:17 - INFO - __main__ - Step 8652: {'lr': 0.0004975126394537884, 'samples': 1661184, 'steps': 8651, 'loss/train': 1.9904800653457642} +11/06/2021 22:27:17 - INFO - __main__ - Step 8653: {'lr': 0.0004975118926749245, 'samples': 1661376, 'steps': 8652, 'loss/train': 2.4816510677337646} +11/06/2021 22:27:17 - INFO - __main__ - Step 8654: {'lr': 0.0004975111457845354, 'samples': 1661568, 'steps': 8653, 'loss/train': 1.7848095893859863} +11/06/2021 22:27:18 - INFO - __main__ - Step 8655: {'lr': 0.0004975103987826217, 'samples': 1661760, 'steps': 8654, 'loss/train': 1.5138027667999268} +11/06/2021 22:27:18 - INFO - __main__ - Step 8656: {'lr': 0.0004975096516691836, 'samples': 1661952, 'steps': 8655, 'loss/train': 2.094496965408325} +11/06/2021 22:27:19 - INFO - __main__ - Step 8657: {'lr': 0.0004975089044442215, 'samples': 1662144, 'steps': 8656, 'loss/train': 2.499422073364258} +11/06/2021 22:27:19 - INFO - __main__ - Step 8658: {'lr': 0.0004975081571077357, 'samples': 1662336, 'steps': 8657, 'loss/train': 2.3265016078948975} +11/06/2021 22:27:20 - INFO - __main__ - Step 8659: {'lr': 0.0004975074096597265, 'samples': 1662528, 'steps': 8658, 'loss/train': 1.801966905593872} +11/06/2021 22:27:20 - INFO - __main__ - Step 8660: {'lr': 0.0004975066621001943, 'samples': 1662720, 'steps': 8659, 'loss/train': 1.1997767686843872} +11/06/2021 22:27:20 - INFO - __main__ - Step 8661: {'lr': 0.0004975059144291394, 'samples': 1662912, 'steps': 8660, 'loss/train': 1.4698797464370728} +11/06/2021 22:27:21 - INFO - __main__ - Step 8662: {'lr': 0.0004975051666465622, 'samples': 1663104, 'steps': 8661, 'loss/train': 2.032155990600586} +11/06/2021 22:27:22 - INFO - __main__ - Step 8663: {'lr': 0.0004975044187524629, 'samples': 1663296, 'steps': 8662, 'loss/train': 1.661537766456604} +11/06/2021 22:27:22 - INFO - __main__ - Step 8664: {'lr': 0.000497503670746842, 'samples': 1663488, 'steps': 8663, 'loss/train': 1.3858249187469482} +11/06/2021 22:27:23 - INFO - __main__ - Step 8665: {'lr': 0.0004975029226296998, 'samples': 1663680, 'steps': 8664, 'loss/train': 2.2269275188446045} +11/06/2021 22:27:23 - INFO - __main__ - Step 8666: {'lr': 0.0004975021744010365, 'samples': 1663872, 'steps': 8665, 'loss/train': 2.003019332885742} +11/06/2021 22:27:23 - INFO - __main__ - Step 8667: {'lr': 0.0004975014260608527, 'samples': 1664064, 'steps': 8666, 'loss/train': 1.5768145322799683} +11/06/2021 22:27:24 - INFO - __main__ - Step 8668: {'lr': 0.0004975006776091484, 'samples': 1664256, 'steps': 8667, 'loss/train': 1.9532525539398193} +11/06/2021 22:27:25 - INFO - __main__ - Step 8669: {'lr': 0.0004974999290459243, 'samples': 1664448, 'steps': 8668, 'loss/train': 1.587928295135498} +11/06/2021 22:27:25 - INFO - __main__ - Step 8670: {'lr': 0.0004974991803711803, 'samples': 1664640, 'steps': 8669, 'loss/train': 1.7508021593093872} +11/06/2021 22:27:25 - INFO - __main__ - Step 8671: {'lr': 0.0004974984315849172, 'samples': 1664832, 'steps': 8670, 'loss/train': 1.5539518594741821} +11/06/2021 22:27:26 - INFO - __main__ - Step 8672: {'lr': 0.000497497682687135, 'samples': 1665024, 'steps': 8671, 'loss/train': 1.5913190841674805} +11/06/2021 22:27:27 - INFO - __main__ - Step 8673: {'lr': 0.0004974969336778343, 'samples': 1665216, 'steps': 8672, 'loss/train': 1.3758063316345215} +11/06/2021 22:27:27 - INFO - __main__ - Step 8674: {'lr': 0.0004974961845570152, 'samples': 1665408, 'steps': 8673, 'loss/train': 1.925683856010437} +11/06/2021 22:27:27 - INFO - __main__ - Step 8675: {'lr': 0.0004974954353246781, 'samples': 1665600, 'steps': 8674, 'loss/train': 1.983332872390747} +11/06/2021 22:27:28 - INFO - __main__ - Step 8676: {'lr': 0.0004974946859808235, 'samples': 1665792, 'steps': 8675, 'loss/train': 1.5062406063079834} +11/06/2021 22:27:28 - INFO - __main__ - Step 8677: {'lr': 0.0004974939365254515, 'samples': 1665984, 'steps': 8676, 'loss/train': 1.4310129880905151} +11/06/2021 22:27:29 - INFO - __main__ - Step 8678: {'lr': 0.0004974931869585626, 'samples': 1666176, 'steps': 8677, 'loss/train': 1.1025075912475586} +11/06/2021 22:27:29 - INFO - __main__ - Step 8679: {'lr': 0.0004974924372801572, 'samples': 1666368, 'steps': 8678, 'loss/train': 1.5145713090896606} +11/06/2021 22:27:30 - INFO - __main__ - Step 8680: {'lr': 0.0004974916874902353, 'samples': 1666560, 'steps': 8679, 'loss/train': 1.819180965423584} +11/06/2021 22:27:30 - INFO - __main__ - Step 8681: {'lr': 0.0004974909375887976, 'samples': 1666752, 'steps': 8680, 'loss/train': 1.7356830835342407} +11/06/2021 22:27:31 - INFO - __main__ - Step 8682: {'lr': 0.0004974901875758444, 'samples': 1666944, 'steps': 8681, 'loss/train': 2.002690315246582} +11/06/2021 22:27:31 - INFO - __main__ - Step 8683: {'lr': 0.0004974894374513757, 'samples': 1667136, 'steps': 8682, 'loss/train': 2.2562174797058105} +11/06/2021 22:27:32 - INFO - __main__ - Step 8684: {'lr': 0.0004974886872153922, 'samples': 1667328, 'steps': 8683, 'loss/train': 1.799873948097229} +11/06/2021 22:27:32 - INFO - __main__ - Step 8685: {'lr': 0.0004974879368678942, 'samples': 1667520, 'steps': 8684, 'loss/train': 2.1796953678131104} +11/06/2021 22:27:32 - INFO - __main__ - Step 8686: {'lr': 0.0004974871864088818, 'samples': 1667712, 'steps': 8685, 'loss/train': 1.7284247875213623} +11/06/2021 22:27:33 - INFO - __main__ - Step 8687: {'lr': 0.0004974864358383555, 'samples': 1667904, 'steps': 8686, 'loss/train': 2.1161437034606934} +11/06/2021 22:27:34 - INFO - __main__ - Step 8688: {'lr': 0.0004974856851563158, 'samples': 1668096, 'steps': 8687, 'loss/train': 1.6163461208343506} +11/06/2021 22:27:34 - INFO - __main__ - Step 8689: {'lr': 0.0004974849343627628, 'samples': 1668288, 'steps': 8688, 'loss/train': 2.1865105628967285} +11/06/2021 22:27:35 - INFO - __main__ - Step 8690: {'lr': 0.0004974841834576968, 'samples': 1668480, 'steps': 8689, 'loss/train': 2.0201218128204346} +11/06/2021 22:27:35 - INFO - __main__ - Step 8691: {'lr': 0.0004974834324411183, 'samples': 1668672, 'steps': 8690, 'loss/train': 1.748487949371338} +11/06/2021 22:27:35 - INFO - __main__ - Step 8692: {'lr': 0.0004974826813130276, 'samples': 1668864, 'steps': 8691, 'loss/train': 1.8078097105026245} +11/06/2021 22:27:36 - INFO - __main__ - Step 8693: {'lr': 0.000497481930073425, 'samples': 1669056, 'steps': 8692, 'loss/train': 1.9291731119155884} +11/06/2021 22:27:37 - INFO - __main__ - Step 8694: {'lr': 0.000497481178722311, 'samples': 1669248, 'steps': 8693, 'loss/train': 1.6936627626419067} +11/06/2021 22:27:37 - INFO - __main__ - Step 8695: {'lr': 0.0004974804272596857, 'samples': 1669440, 'steps': 8694, 'loss/train': 1.6667145490646362} +11/06/2021 22:27:37 - INFO - __main__ - Step 8696: {'lr': 0.0004974796756855494, 'samples': 1669632, 'steps': 8695, 'loss/train': 1.6822011470794678} +11/06/2021 22:27:38 - INFO - __main__ - Step 8697: {'lr': 0.0004974789239999027, 'samples': 1669824, 'steps': 8696, 'loss/train': 1.7184191942214966} +11/06/2021 22:27:38 - INFO - __main__ - Step 8698: {'lr': 0.0004974781722027459, 'samples': 1670016, 'steps': 8697, 'loss/train': 1.8397278785705566} +11/06/2021 22:27:39 - INFO - __main__ - Step 8699: {'lr': 0.0004974774202940791, 'samples': 1670208, 'steps': 8698, 'loss/train': 1.9065308570861816} +11/06/2021 22:27:40 - INFO - __main__ - Step 8700: {'lr': 0.000497476668273903, 'samples': 1670400, 'steps': 8699, 'loss/train': 0.9457817673683167} +11/06/2021 22:27:40 - INFO - __main__ - Step 8701: {'lr': 0.0004974759161422175, 'samples': 1670592, 'steps': 8700, 'loss/train': 1.5651483535766602} +11/06/2021 22:27:40 - INFO - __main__ - Step 8702: {'lr': 0.0004974751638990233, 'samples': 1670784, 'steps': 8701, 'loss/train': 1.9571999311447144} +11/06/2021 22:27:41 - INFO - __main__ - Step 8703: {'lr': 0.0004974744115443206, 'samples': 1670976, 'steps': 8702, 'loss/train': 1.1419717073440552} +11/06/2021 22:27:42 - INFO - __main__ - Step 8704: {'lr': 0.0004974736590781097, 'samples': 1671168, 'steps': 8703, 'loss/train': 2.3399507999420166} +11/06/2021 22:27:42 - INFO - __main__ - Step 8705: {'lr': 0.000497472906500391, 'samples': 1671360, 'steps': 8704, 'loss/train': 1.9851784706115723} +11/06/2021 22:27:43 - INFO - __main__ - Step 8706: {'lr': 0.0004974721538111649, 'samples': 1671552, 'steps': 8705, 'loss/train': 1.7644202709197998} +11/06/2021 22:27:43 - INFO - __main__ - Step 8707: {'lr': 0.0004974714010104315, 'samples': 1671744, 'steps': 8706, 'loss/train': 2.234442949295044} +11/06/2021 22:27:43 - INFO - __main__ - Step 8708: {'lr': 0.0004974706480981914, 'samples': 1671936, 'steps': 8707, 'loss/train': 1.5944517850875854} +11/06/2021 22:27:44 - INFO - __main__ - Step 8709: {'lr': 0.0004974698950744449, 'samples': 1672128, 'steps': 8708, 'loss/train': 2.5472395420074463} +11/06/2021 22:27:45 - INFO - __main__ - Step 8710: {'lr': 0.0004974691419391922, 'samples': 1672320, 'steps': 8709, 'loss/train': 1.8900412321090698} +11/06/2021 22:27:45 - INFO - __main__ - Step 8711: {'lr': 0.0004974683886924339, 'samples': 1672512, 'steps': 8710, 'loss/train': 1.7456995248794556} +11/06/2021 22:27:45 - INFO - __main__ - Step 8712: {'lr': 0.00049746763533417, 'samples': 1672704, 'steps': 8711, 'loss/train': 2.188673257827759} +11/06/2021 22:27:46 - INFO - __main__ - Step 8713: {'lr': 0.000497466881864401, 'samples': 1672896, 'steps': 8712, 'loss/train': 1.39998459815979} +11/06/2021 22:27:46 - INFO - __main__ - Step 8714: {'lr': 0.0004974661282831272, 'samples': 1673088, 'steps': 8713, 'loss/train': 1.890992522239685} +11/06/2021 22:27:47 - INFO - __main__ - Step 8715: {'lr': 0.0004974653745903491, 'samples': 1673280, 'steps': 8714, 'loss/train': 1.2863065004348755} +11/06/2021 22:27:47 - INFO - __main__ - Step 8716: {'lr': 0.0004974646207860668, 'samples': 1673472, 'steps': 8715, 'loss/train': 2.333582878112793} +11/06/2021 22:27:48 - INFO - __main__ - Step 8717: {'lr': 0.0004974638668702809, 'samples': 1673664, 'steps': 8716, 'loss/train': 0.5336604714393616} +11/06/2021 22:27:48 - INFO - __main__ - Step 8718: {'lr': 0.0004974631128429915, 'samples': 1673856, 'steps': 8717, 'loss/train': 2.640268564224243} +11/06/2021 22:27:48 - INFO - __main__ - Step 8719: {'lr': 0.0004974623587041991, 'samples': 1674048, 'steps': 8718, 'loss/train': 2.1433913707733154} +11/06/2021 22:27:49 - INFO - __main__ - Step 8720: {'lr': 0.000497461604453904, 'samples': 1674240, 'steps': 8719, 'loss/train': 1.5393385887145996} +11/06/2021 22:27:50 - INFO - __main__ - Step 8721: {'lr': 0.0004974608500921064, 'samples': 1674432, 'steps': 8720, 'loss/train': 2.028142213821411} +11/06/2021 22:27:50 - INFO - __main__ - Step 8722: {'lr': 0.0004974600956188068, 'samples': 1674624, 'steps': 8721, 'loss/train': 1.8649543523788452} +11/06/2021 22:27:50 - INFO - __main__ - Step 8723: {'lr': 0.0004974593410340056, 'samples': 1674816, 'steps': 8722, 'loss/train': 1.037925124168396} +11/06/2021 22:27:51 - INFO - __main__ - Step 8724: {'lr': 0.000497458586337703, 'samples': 1675008, 'steps': 8723, 'loss/train': 1.7672851085662842} +11/06/2021 22:27:52 - INFO - __main__ - Step 8725: {'lr': 0.0004974578315298993, 'samples': 1675200, 'steps': 8724, 'loss/train': 1.966469407081604} +11/06/2021 22:27:52 - INFO - __main__ - Step 8726: {'lr': 0.000497457076610595, 'samples': 1675392, 'steps': 8725, 'loss/train': 1.7877483367919922} +11/06/2021 22:27:53 - INFO - __main__ - Step 8727: {'lr': 0.0004974563215797903, 'samples': 1675584, 'steps': 8726, 'loss/train': 1.3742201328277588} +11/06/2021 22:27:53 - INFO - __main__ - Step 8728: {'lr': 0.0004974555664374857, 'samples': 1675776, 'steps': 8727, 'loss/train': 2.265516757965088} +11/06/2021 22:27:53 - INFO - __main__ - Step 8729: {'lr': 0.0004974548111836812, 'samples': 1675968, 'steps': 8728, 'loss/train': 1.7990782260894775} +11/06/2021 22:27:54 - INFO - __main__ - Step 8730: {'lr': 0.0004974540558183776, 'samples': 1676160, 'steps': 8729, 'loss/train': 1.5700663328170776} +11/06/2021 22:27:55 - INFO - __main__ - Step 8731: {'lr': 0.0004974533003415751, 'samples': 1676352, 'steps': 8730, 'loss/train': 2.584472894668579} +11/06/2021 22:27:55 - INFO - __main__ - Step 8732: {'lr': 0.0004974525447532737, 'samples': 1676544, 'steps': 8731, 'loss/train': 0.7004466652870178} +11/06/2021 22:27:55 - INFO - __main__ - Step 8733: {'lr': 0.0004974517890534742, 'samples': 1676736, 'steps': 8732, 'loss/train': 2.029585361480713} +11/06/2021 22:27:56 - INFO - __main__ - Step 8734: {'lr': 0.0004974510332421767, 'samples': 1676928, 'steps': 8733, 'loss/train': 2.3354976177215576} +11/06/2021 22:27:57 - INFO - __main__ - Step 8735: {'lr': 0.0004974502773193815, 'samples': 1677120, 'steps': 8734, 'loss/train': 1.779792308807373} +11/06/2021 22:27:57 - INFO - __main__ - Step 8736: {'lr': 0.0004974495212850892, 'samples': 1677312, 'steps': 8735, 'loss/train': 1.7999184131622314} +11/06/2021 22:27:58 - INFO - __main__ - Step 8737: {'lr': 0.0004974487651392998, 'samples': 1677504, 'steps': 8736, 'loss/train': 2.0719504356384277} +11/06/2021 22:27:58 - INFO - __main__ - Step 8738: {'lr': 0.0004974480088820139, 'samples': 1677696, 'steps': 8737, 'loss/train': 1.93135666847229} +11/06/2021 22:27:59 - INFO - __main__ - Step 8739: {'lr': 0.0004974472525132316, 'samples': 1677888, 'steps': 8738, 'loss/train': 2.191235303878784} +11/06/2021 22:27:59 - INFO - __main__ - Step 8740: {'lr': 0.0004974464960329536, 'samples': 1678080, 'steps': 8739, 'loss/train': 1.711877465248108} +11/06/2021 22:28:00 - INFO - __main__ - Step 8741: {'lr': 0.0004974457394411798, 'samples': 1678272, 'steps': 8740, 'loss/train': 1.1441311836242676} +11/06/2021 22:28:00 - INFO - __main__ - Step 8742: {'lr': 0.0004974449827379109, 'samples': 1678464, 'steps': 8741, 'loss/train': 2.325981616973877} +11/06/2021 22:28:01 - INFO - __main__ - Step 8743: {'lr': 0.000497444225923147, 'samples': 1678656, 'steps': 8742, 'loss/train': 1.826312780380249} +11/06/2021 22:28:01 - INFO - __main__ - Step 8744: {'lr': 0.0004974434689968887, 'samples': 1678848, 'steps': 8743, 'loss/train': 2.2900896072387695} +11/06/2021 22:28:01 - INFO - __main__ - Step 8745: {'lr': 0.0004974427119591361, 'samples': 1679040, 'steps': 8744, 'loss/train': 2.352595090866089} +11/06/2021 22:28:02 - INFO - __main__ - Step 8746: {'lr': 0.0004974419548098897, 'samples': 1679232, 'steps': 8745, 'loss/train': 1.2469137907028198} +11/06/2021 22:28:03 - INFO - __main__ - Step 8747: {'lr': 0.0004974411975491498, 'samples': 1679424, 'steps': 8746, 'loss/train': 1.8148316144943237} +11/06/2021 22:28:03 - INFO - __main__ - Step 8748: {'lr': 0.0004974404401769167, 'samples': 1679616, 'steps': 8747, 'loss/train': 2.2442069053649902} +11/06/2021 22:28:03 - INFO - __main__ - Step 8749: {'lr': 0.0004974396826931906, 'samples': 1679808, 'steps': 8748, 'loss/train': 2.0725631713867188} +11/06/2021 22:28:04 - INFO - __main__ - Step 8750: {'lr': 0.0004974389250979722, 'samples': 1680000, 'steps': 8749, 'loss/train': 1.7763142585754395} +11/06/2021 22:28:05 - INFO - __main__ - Step 8751: {'lr': 0.0004974381673912614, 'samples': 1680192, 'steps': 8750, 'loss/train': 2.2424070835113525} +11/06/2021 22:28:05 - INFO - __main__ - Step 8752: {'lr': 0.000497437409573059, 'samples': 1680384, 'steps': 8751, 'loss/train': 1.8414136171340942} +11/06/2021 22:28:05 - INFO - __main__ - Step 8753: {'lr': 0.000497436651643365, 'samples': 1680576, 'steps': 8752, 'loss/train': 1.7458195686340332} +11/06/2021 22:28:06 - INFO - __main__ - Step 8754: {'lr': 0.00049743589360218, 'samples': 1680768, 'steps': 8753, 'loss/train': 2.1746933460235596} +11/06/2021 22:28:06 - INFO - __main__ - Step 8755: {'lr': 0.0004974351354495041, 'samples': 1680960, 'steps': 8754, 'loss/train': 1.9091649055480957} +11/06/2021 22:28:07 - INFO - __main__ - Step 8756: {'lr': 0.0004974343771853377, 'samples': 1681152, 'steps': 8755, 'loss/train': 1.7813023328781128} +11/06/2021 22:28:07 - INFO - __main__ - Step 8757: {'lr': 0.0004974336188096813, 'samples': 1681344, 'steps': 8756, 'loss/train': 1.627087116241455} +11/06/2021 22:28:08 - INFO - __main__ - Step 8758: {'lr': 0.0004974328603225351, 'samples': 1681536, 'steps': 8757, 'loss/train': 1.492101788520813} +11/06/2021 22:28:08 - INFO - __main__ - Step 8759: {'lr': 0.0004974321017238994, 'samples': 1681728, 'steps': 8758, 'loss/train': 1.5569329261779785} +11/06/2021 22:28:09 - INFO - __main__ - Step 8760: {'lr': 0.0004974313430137747, 'samples': 1681920, 'steps': 8759, 'loss/train': 1.9305700063705444} +11/06/2021 22:28:10 - INFO - __main__ - Step 8761: {'lr': 0.0004974305841921612, 'samples': 1682112, 'steps': 8760, 'loss/train': 1.7186388969421387} +11/06/2021 22:28:10 - INFO - __main__ - Step 8762: {'lr': 0.0004974298252590593, 'samples': 1682304, 'steps': 8761, 'loss/train': 1.9467127323150635} +11/06/2021 22:28:10 - INFO - __main__ - Step 8763: {'lr': 0.0004974290662144694, 'samples': 1682496, 'steps': 8762, 'loss/train': 1.675337791442871} +11/06/2021 22:28:11 - INFO - __main__ - Step 8764: {'lr': 0.0004974283070583917, 'samples': 1682688, 'steps': 8763, 'loss/train': 1.5082322359085083} +11/06/2021 22:28:11 - INFO - __main__ - Step 8765: {'lr': 0.0004974275477908266, 'samples': 1682880, 'steps': 8764, 'loss/train': 2.1924538612365723} +11/06/2021 22:28:12 - INFO - __main__ - Step 8766: {'lr': 0.0004974267884117746, 'samples': 1683072, 'steps': 8765, 'loss/train': 0.8508917093276978} +11/06/2021 22:28:12 - INFO - __main__ - Step 8767: {'lr': 0.0004974260289212358, 'samples': 1683264, 'steps': 8766, 'loss/train': 1.8229551315307617} +11/06/2021 22:28:13 - INFO - __main__ - Step 8768: {'lr': 0.0004974252693192106, 'samples': 1683456, 'steps': 8767, 'loss/train': 1.7984812259674072} +11/06/2021 22:28:13 - INFO - __main__ - Step 8769: {'lr': 0.0004974245096056995, 'samples': 1683648, 'steps': 8768, 'loss/train': 1.664389729499817} +11/06/2021 22:28:13 - INFO - __main__ - Step 8770: {'lr': 0.0004974237497807027, 'samples': 1683840, 'steps': 8769, 'loss/train': 0.3073934018611908} +11/06/2021 22:28:14 - INFO - __main__ - Step 8771: {'lr': 0.0004974229898442207, 'samples': 1684032, 'steps': 8770, 'loss/train': 1.7521414756774902} +11/06/2021 22:28:15 - INFO - __main__ - Step 8772: {'lr': 0.0004974222297962535, 'samples': 1684224, 'steps': 8771, 'loss/train': 1.6954983472824097} +11/06/2021 22:28:15 - INFO - __main__ - Step 8773: {'lr': 0.0004974214696368017, 'samples': 1684416, 'steps': 8772, 'loss/train': 1.7648489475250244} +11/06/2021 22:28:15 - INFO - __main__ - Step 8774: {'lr': 0.0004974207093658657, 'samples': 1684608, 'steps': 8773, 'loss/train': 1.5386720895767212} +11/06/2021 22:28:16 - INFO - __main__ - Step 8775: {'lr': 0.0004974199489834457, 'samples': 1684800, 'steps': 8774, 'loss/train': 1.757877230644226} +11/06/2021 22:28:17 - INFO - __main__ - Step 8776: {'lr': 0.0004974191884895421, 'samples': 1684992, 'steps': 8775, 'loss/train': 1.9185556173324585} +11/06/2021 22:28:17 - INFO - __main__ - Step 8777: {'lr': 0.0004974184278841552, 'samples': 1685184, 'steps': 8776, 'loss/train': 2.359382152557373} +11/06/2021 22:28:18 - INFO - __main__ - Step 8778: {'lr': 0.0004974176671672854, 'samples': 1685376, 'steps': 8777, 'loss/train': 1.3928838968276978} +11/06/2021 22:28:18 - INFO - __main__ - Step 8779: {'lr': 0.000497416906338933, 'samples': 1685568, 'steps': 8778, 'loss/train': 2.1888182163238525} +11/06/2021 22:28:18 - INFO - __main__ - Step 8780: {'lr': 0.0004974161453990985, 'samples': 1685760, 'steps': 8779, 'loss/train': 1.9797148704528809} +11/06/2021 22:28:19 - INFO - __main__ - Step 8781: {'lr': 0.0004974153843477819, 'samples': 1685952, 'steps': 8780, 'loss/train': 1.6259188652038574} +11/06/2021 22:28:20 - INFO - __main__ - Step 8782: {'lr': 0.0004974146231849838, 'samples': 1686144, 'steps': 8781, 'loss/train': 1.612627387046814} +11/06/2021 22:28:20 - INFO - __main__ - Step 8783: {'lr': 0.0004974138619107046, 'samples': 1686336, 'steps': 8782, 'loss/train': 1.9349783658981323} +11/06/2021 22:28:20 - INFO - __main__ - Step 8784: {'lr': 0.0004974131005249444, 'samples': 1686528, 'steps': 8783, 'loss/train': 1.3217498064041138} +11/06/2021 22:28:21 - INFO - __main__ - Step 8785: {'lr': 0.0004974123390277037, 'samples': 1686720, 'steps': 8784, 'loss/train': 0.9705907702445984} +11/06/2021 22:28:21 - INFO - __main__ - Step 8786: {'lr': 0.0004974115774189829, 'samples': 1686912, 'steps': 8785, 'loss/train': 1.2650182247161865} +11/06/2021 22:28:22 - INFO - __main__ - Step 8787: {'lr': 0.0004974108156987822, 'samples': 1687104, 'steps': 8786, 'loss/train': 1.8180323839187622} +11/06/2021 22:28:23 - INFO - __main__ - Step 8788: {'lr': 0.000497410053867102, 'samples': 1687296, 'steps': 8787, 'loss/train': 2.028273105621338} +11/06/2021 22:28:23 - INFO - __main__ - Step 8789: {'lr': 0.0004974092919239427, 'samples': 1687488, 'steps': 8788, 'loss/train': 1.8566056489944458} +11/06/2021 22:28:23 - INFO - __main__ - Step 8790: {'lr': 0.0004974085298693045, 'samples': 1687680, 'steps': 8789, 'loss/train': 1.7841997146606445} +11/06/2021 22:28:24 - INFO - __main__ - Step 8791: {'lr': 0.0004974077677031879, 'samples': 1687872, 'steps': 8790, 'loss/train': 1.7749842405319214} +11/06/2021 22:28:25 - INFO - __main__ - Step 8792: {'lr': 0.0004974070054255932, 'samples': 1688064, 'steps': 8791, 'loss/train': 1.3394575119018555} +11/06/2021 22:28:25 - INFO - __main__ - Step 8793: {'lr': 0.0004974062430365206, 'samples': 1688256, 'steps': 8792, 'loss/train': 2.017791509628296} +11/06/2021 22:28:25 - INFO - __main__ - Step 8794: {'lr': 0.0004974054805359706, 'samples': 1688448, 'steps': 8793, 'loss/train': 1.5951640605926514} +11/06/2021 22:28:26 - INFO - __main__ - Step 8795: {'lr': 0.0004974047179239436, 'samples': 1688640, 'steps': 8794, 'loss/train': 1.9513581991195679} +11/06/2021 22:28:26 - INFO - __main__ - Step 8796: {'lr': 0.0004974039552004398, 'samples': 1688832, 'steps': 8795, 'loss/train': 1.227823257446289} +11/06/2021 22:28:27 - INFO - __main__ - Step 8797: {'lr': 0.0004974031923654596, 'samples': 1689024, 'steps': 8796, 'loss/train': 1.9323481321334839} +11/06/2021 22:28:27 - INFO - __main__ - Step 8798: {'lr': 0.0004974024294190034, 'samples': 1689216, 'steps': 8797, 'loss/train': 1.6938538551330566} +11/06/2021 22:28:28 - INFO - __main__ - Step 8799: {'lr': 0.0004974016663610713, 'samples': 1689408, 'steps': 8798, 'loss/train': 1.885172724723816} +11/06/2021 22:28:28 - INFO - __main__ - Step 8800: {'lr': 0.000497400903191664, 'samples': 1689600, 'steps': 8799, 'loss/train': 1.5480501651763916} +11/06/2021 22:28:28 - INFO - __main__ - Step 8801: {'lr': 0.0004974001399107816, 'samples': 1689792, 'steps': 8800, 'loss/train': 2.519402265548706} +11/06/2021 22:28:29 - INFO - __main__ - Step 8802: {'lr': 0.0004973993765184246, 'samples': 1689984, 'steps': 8801, 'loss/train': 1.6957279443740845} +11/06/2021 22:28:30 - INFO - __main__ - Step 8803: {'lr': 0.0004973986130145931, 'samples': 1690176, 'steps': 8802, 'loss/train': 1.698414921760559} +11/06/2021 22:28:30 - INFO - __main__ - Step 8804: {'lr': 0.0004973978493992877, 'samples': 1690368, 'steps': 8803, 'loss/train': 1.4111169576644897} +11/06/2021 22:28:30 - INFO - __main__ - Step 8805: {'lr': 0.0004973970856725086, 'samples': 1690560, 'steps': 8804, 'loss/train': 1.862740159034729} +11/06/2021 22:28:31 - INFO - __main__ - Step 8806: {'lr': 0.0004973963218342563, 'samples': 1690752, 'steps': 8805, 'loss/train': 1.8943990468978882} +11/06/2021 22:28:32 - INFO - __main__ - Step 8807: {'lr': 0.000497395557884531, 'samples': 1690944, 'steps': 8806, 'loss/train': 2.2840816974639893} +11/06/2021 22:28:32 - INFO - __main__ - Step 8808: {'lr': 0.000497394793823333, 'samples': 1691136, 'steps': 8807, 'loss/train': 1.346774697303772} +11/06/2021 22:28:33 - INFO - __main__ - Step 8809: {'lr': 0.0004973940296506627, 'samples': 1691328, 'steps': 8808, 'loss/train': 1.4218136072158813} +11/06/2021 22:28:33 - INFO - __main__ - Step 8810: {'lr': 0.0004973932653665206, 'samples': 1691520, 'steps': 8809, 'loss/train': 0.507257878780365} +11/06/2021 22:28:33 - INFO - __main__ - Step 8811: {'lr': 0.0004973925009709068, 'samples': 1691712, 'steps': 8810, 'loss/train': 1.9113545417785645} +11/06/2021 22:28:34 - INFO - __main__ - Step 8812: {'lr': 0.0004973917364638218, 'samples': 1691904, 'steps': 8811, 'loss/train': 1.7712737321853638} +11/06/2021 22:28:34 - INFO - __main__ - Step 8813: {'lr': 0.0004973909718452659, 'samples': 1692096, 'steps': 8812, 'loss/train': 2.098034381866455} +11/06/2021 22:28:35 - INFO - __main__ - Step 8814: {'lr': 0.0004973902071152396, 'samples': 1692288, 'steps': 8813, 'loss/train': 1.7307425737380981} +11/06/2021 22:28:35 - INFO - __main__ - Step 8815: {'lr': 0.0004973894422737428, 'samples': 1692480, 'steps': 8814, 'loss/train': 1.682647466659546} +11/06/2021 22:28:36 - INFO - __main__ - Step 8816: {'lr': 0.0004973886773207763, 'samples': 1692672, 'steps': 8815, 'loss/train': 1.6713685989379883} +11/06/2021 22:28:37 - INFO - __main__ - Step 8817: {'lr': 0.0004973879122563403, 'samples': 1692864, 'steps': 8816, 'loss/train': 2.685642957687378} +11/06/2021 22:28:37 - INFO - __main__ - Step 8818: {'lr': 0.000497387147080435, 'samples': 1693056, 'steps': 8817, 'loss/train': 1.6026307344436646} +11/06/2021 22:28:37 - INFO - __main__ - Step 8819: {'lr': 0.000497386381793061, 'samples': 1693248, 'steps': 8818, 'loss/train': 1.8597676753997803} +11/06/2021 22:28:38 - INFO - __main__ - Step 8820: {'lr': 0.0004973856163942185, 'samples': 1693440, 'steps': 8819, 'loss/train': 1.8286590576171875} +11/06/2021 22:28:38 - INFO - __main__ - Step 8821: {'lr': 0.0004973848508839077, 'samples': 1693632, 'steps': 8820, 'loss/train': 1.868646264076233} +11/06/2021 22:28:38 - INFO - __main__ - Step 8822: {'lr': 0.0004973840852621293, 'samples': 1693824, 'steps': 8821, 'loss/train': 1.4488940238952637} +11/06/2021 22:28:39 - INFO - __main__ - Step 8823: {'lr': 0.0004973833195288834, 'samples': 1694016, 'steps': 8822, 'loss/train': 1.7625603675842285} +11/06/2021 22:28:40 - INFO - __main__ - Step 8824: {'lr': 0.0004973825536841703, 'samples': 1694208, 'steps': 8823, 'loss/train': 1.8687225580215454} +11/06/2021 22:28:40 - INFO - __main__ - Step 8825: {'lr': 0.0004973817877279906, 'samples': 1694400, 'steps': 8824, 'loss/train': 1.4771027565002441} +11/06/2021 22:28:41 - INFO - __main__ - Step 8826: {'lr': 0.0004973810216603443, 'samples': 1694592, 'steps': 8825, 'loss/train': 0.3064444959163666} +11/06/2021 22:28:41 - INFO - __main__ - Step 8827: {'lr': 0.000497380255481232, 'samples': 1694784, 'steps': 8826, 'loss/train': 1.9688664674758911} +11/06/2021 22:28:42 - INFO - __main__ - Step 8828: {'lr': 0.000497379489190654, 'samples': 1694976, 'steps': 8827, 'loss/train': 1.279405117034912} +11/06/2021 22:28:42 - INFO - __main__ - Step 8829: {'lr': 0.0004973787227886106, 'samples': 1695168, 'steps': 8828, 'loss/train': 1.0162687301635742} +11/06/2021 22:28:43 - INFO - __main__ - Step 8830: {'lr': 0.0004973779562751022, 'samples': 1695360, 'steps': 8829, 'loss/train': 1.7933107614517212} +11/06/2021 22:28:43 - INFO - __main__ - Step 8831: {'lr': 0.0004973771896501292, 'samples': 1695552, 'steps': 8830, 'loss/train': 2.0314056873321533} +11/06/2021 22:28:43 - INFO - __main__ - Step 8832: {'lr': 0.0004973764229136917, 'samples': 1695744, 'steps': 8831, 'loss/train': 1.8036915063858032} +11/06/2021 22:28:44 - INFO - __main__ - Step 8833: {'lr': 0.0004973756560657901, 'samples': 1695936, 'steps': 8832, 'loss/train': 1.417937994003296} +11/06/2021 22:28:45 - INFO - __main__ - Step 8834: {'lr': 0.0004973748891064251, 'samples': 1696128, 'steps': 8833, 'loss/train': 1.0796078443527222} +11/06/2021 22:28:45 - INFO - __main__ - Step 8835: {'lr': 0.0004973741220355967, 'samples': 1696320, 'steps': 8834, 'loss/train': 1.756775975227356} +11/06/2021 22:28:45 - INFO - __main__ - Step 8836: {'lr': 0.0004973733548533052, 'samples': 1696512, 'steps': 8835, 'loss/train': 1.7436381578445435} +11/06/2021 22:28:46 - INFO - __main__ - Step 8837: {'lr': 0.0004973725875595513, 'samples': 1696704, 'steps': 8836, 'loss/train': 2.336061716079712} +11/06/2021 22:28:47 - INFO - __main__ - Step 8838: {'lr': 0.000497371820154335, 'samples': 1696896, 'steps': 8837, 'loss/train': 1.9740123748779297} +11/06/2021 22:28:47 - INFO - __main__ - Step 8839: {'lr': 0.0004973710526376569, 'samples': 1697088, 'steps': 8838, 'loss/train': 0.7141327261924744} +11/06/2021 22:28:47 - INFO - __main__ - Step 8840: {'lr': 0.000497370285009517, 'samples': 1697280, 'steps': 8839, 'loss/train': 1.4266327619552612} +11/06/2021 22:28:48 - INFO - __main__ - Step 8841: {'lr': 0.000497369517269916, 'samples': 1697472, 'steps': 8840, 'loss/train': 2.1014244556427} +11/06/2021 22:28:48 - INFO - __main__ - Step 8842: {'lr': 0.0004973687494188541, 'samples': 1697664, 'steps': 8841, 'loss/train': 1.9083147048950195} +11/06/2021 22:28:49 - INFO - __main__ - Step 8843: {'lr': 0.0004973679814563318, 'samples': 1697856, 'steps': 8842, 'loss/train': 1.9293524026870728} +11/06/2021 22:28:50 - INFO - __main__ - Step 8844: {'lr': 0.0004973672133823491, 'samples': 1698048, 'steps': 8843, 'loss/train': 1.9651559591293335} +11/06/2021 22:28:50 - INFO - __main__ - Step 8845: {'lr': 0.0004973664451969066, 'samples': 1698240, 'steps': 8844, 'loss/train': 2.337369203567505} +11/06/2021 22:28:50 - INFO - __main__ - Step 8846: {'lr': 0.0004973656769000046, 'samples': 1698432, 'steps': 8845, 'loss/train': 1.0025054216384888} +11/06/2021 22:28:51 - INFO - __main__ - Step 8847: {'lr': 0.0004973649084916435, 'samples': 1698624, 'steps': 8846, 'loss/train': 2.6142988204956055} +11/06/2021 22:28:52 - INFO - __main__ - Step 8848: {'lr': 0.0004973641399718236, 'samples': 1698816, 'steps': 8847, 'loss/train': 2.0085182189941406} +11/06/2021 22:28:52 - INFO - __main__ - Step 8849: {'lr': 0.0004973633713405451, 'samples': 1699008, 'steps': 8848, 'loss/train': 1.4306745529174805} +11/06/2021 22:28:53 - INFO - __main__ - Step 8850: {'lr': 0.0004973626025978086, 'samples': 1699200, 'steps': 8849, 'loss/train': 1.551592469215393} +11/06/2021 22:28:53 - INFO - __main__ - Step 8851: {'lr': 0.0004973618337436143, 'samples': 1699392, 'steps': 8850, 'loss/train': 1.7350374460220337} +11/06/2021 22:28:53 - INFO - __main__ - Step 8852: {'lr': 0.0004973610647779626, 'samples': 1699584, 'steps': 8851, 'loss/train': 1.860516905784607} +11/06/2021 22:28:54 - INFO - __main__ - Step 8853: {'lr': 0.0004973602957008537, 'samples': 1699776, 'steps': 8852, 'loss/train': 1.765555739402771} +11/06/2021 22:28:55 - INFO - __main__ - Step 8854: {'lr': 0.0004973595265122883, 'samples': 1699968, 'steps': 8853, 'loss/train': 2.4081969261169434} +11/06/2021 22:28:55 - INFO - __main__ - Step 8855: {'lr': 0.0004973587572122663, 'samples': 1700160, 'steps': 8854, 'loss/train': 1.8850605487823486} +11/06/2021 22:28:55 - INFO - __main__ - Step 8856: {'lr': 0.0004973579878007884, 'samples': 1700352, 'steps': 8855, 'loss/train': 1.608045220375061} +11/06/2021 22:28:56 - INFO - __main__ - Step 8857: {'lr': 0.0004973572182778546, 'samples': 1700544, 'steps': 8856, 'loss/train': 1.670106291770935} +11/06/2021 22:28:56 - INFO - __main__ - Step 8858: {'lr': 0.0004973564486434656, 'samples': 1700736, 'steps': 8857, 'loss/train': 1.6520261764526367} +11/06/2021 22:28:57 - INFO - __main__ - Step 8859: {'lr': 0.0004973556788976217, 'samples': 1700928, 'steps': 8858, 'loss/train': 1.5881348848342896} +11/06/2021 22:28:57 - INFO - __main__ - Step 8860: {'lr': 0.000497354909040323, 'samples': 1701120, 'steps': 8859, 'loss/train': 1.7174054384231567} +11/06/2021 22:28:58 - INFO - __main__ - Step 8861: {'lr': 0.00049735413907157, 'samples': 1701312, 'steps': 8860, 'loss/train': 1.8992524147033691} +11/06/2021 22:28:58 - INFO - __main__ - Step 8862: {'lr': 0.0004973533689913631, 'samples': 1701504, 'steps': 8861, 'loss/train': 1.570049524307251} +11/06/2021 22:28:58 - INFO - __main__ - Step 8863: {'lr': 0.0004973525987997026, 'samples': 1701696, 'steps': 8862, 'loss/train': 2.445530891418457} +11/06/2021 22:28:59 - INFO - __main__ - Step 8864: {'lr': 0.0004973518284965888, 'samples': 1701888, 'steps': 8863, 'loss/train': 1.9217685461044312} +11/06/2021 22:29:00 - INFO - __main__ - Step 8865: {'lr': 0.0004973510580820221, 'samples': 1702080, 'steps': 8864, 'loss/train': 1.8503520488739014} +11/06/2021 22:29:00 - INFO - __main__ - Step 8866: {'lr': 0.0004973502875560028, 'samples': 1702272, 'steps': 8865, 'loss/train': 1.635284185409546} +11/06/2021 22:29:01 - INFO - __main__ - Step 8867: {'lr': 0.0004973495169185313, 'samples': 1702464, 'steps': 8866, 'loss/train': 1.2922062873840332} +11/06/2021 22:29:01 - INFO - __main__ - Step 8868: {'lr': 0.0004973487461696079, 'samples': 1702656, 'steps': 8867, 'loss/train': 1.878747820854187} +11/06/2021 22:29:02 - INFO - __main__ - Step 8869: {'lr': 0.000497347975309233, 'samples': 1702848, 'steps': 8868, 'loss/train': 1.7777513265609741} +11/06/2021 22:29:02 - INFO - __main__ - Step 8870: {'lr': 0.0004973472043374069, 'samples': 1703040, 'steps': 8869, 'loss/train': 1.8679721355438232} +11/06/2021 22:29:03 - INFO - __main__ - Step 8871: {'lr': 0.00049734643325413, 'samples': 1703232, 'steps': 8870, 'loss/train': 1.7162529230117798} +11/06/2021 22:29:03 - INFO - __main__ - Step 8872: {'lr': 0.0004973456620594026, 'samples': 1703424, 'steps': 8871, 'loss/train': 1.8824801445007324} +11/06/2021 22:29:03 - INFO - __main__ - Step 8873: {'lr': 0.0004973448907532251, 'samples': 1703616, 'steps': 8872, 'loss/train': 1.3267327547073364} +11/06/2021 22:29:04 - INFO - __main__ - Step 8874: {'lr': 0.0004973441193355978, 'samples': 1703808, 'steps': 8873, 'loss/train': 2.032459259033203} +11/06/2021 22:29:05 - INFO - __main__ - Step 8875: {'lr': 0.0004973433478065209, 'samples': 1704000, 'steps': 8874, 'loss/train': 1.6638219356536865} +11/06/2021 22:29:05 - INFO - __main__ - Step 8876: {'lr': 0.0004973425761659951, 'samples': 1704192, 'steps': 8875, 'loss/train': 1.3877533674240112} +11/06/2021 22:29:05 - INFO - __main__ - Step 8877: {'lr': 0.0004973418044140204, 'samples': 1704384, 'steps': 8876, 'loss/train': 1.6968107223510742} +11/06/2021 22:29:06 - INFO - __main__ - Step 8878: {'lr': 0.0004973410325505974, 'samples': 1704576, 'steps': 8877, 'loss/train': 0.47580868005752563} +11/06/2021 22:29:07 - INFO - __main__ - Step 8879: {'lr': 0.0004973402605757263, 'samples': 1704768, 'steps': 8878, 'loss/train': 1.8513538837432861} +11/06/2021 22:29:07 - INFO - __main__ - Step 8880: {'lr': 0.0004973394884894075, 'samples': 1704960, 'steps': 8879, 'loss/train': 1.8675156831741333} +11/06/2021 22:29:08 - INFO - __main__ - Step 8881: {'lr': 0.0004973387162916415, 'samples': 1705152, 'steps': 8880, 'loss/train': 1.1261378526687622} +11/06/2021 22:29:08 - INFO - __main__ - Step 8882: {'lr': 0.0004973379439824283, 'samples': 1705344, 'steps': 8881, 'loss/train': 2.2020576000213623} +11/06/2021 22:29:09 - INFO - __main__ - Step 8883: {'lr': 0.0004973371715617685, 'samples': 1705536, 'steps': 8882, 'loss/train': 1.241743803024292} +11/06/2021 22:29:09 - INFO - __main__ - Step 8884: {'lr': 0.0004973363990296624, 'samples': 1705728, 'steps': 8883, 'loss/train': 1.7667030096054077} +11/06/2021 22:29:10 - INFO - __main__ - Step 8885: {'lr': 0.0004973356263861103, 'samples': 1705920, 'steps': 8884, 'loss/train': 1.5185878276824951} +11/06/2021 22:29:10 - INFO - __main__ - Step 8886: {'lr': 0.0004973348536311126, 'samples': 1706112, 'steps': 8885, 'loss/train': 2.001230001449585} +11/06/2021 22:29:11 - INFO - __main__ - Step 8887: {'lr': 0.0004973340807646696, 'samples': 1706304, 'steps': 8886, 'loss/train': 2.3790831565856934} +11/06/2021 22:29:11 - INFO - __main__ - Step 8888: {'lr': 0.0004973333077867817, 'samples': 1706496, 'steps': 8887, 'loss/train': 1.9295786619186401} +11/06/2021 22:29:11 - INFO - __main__ - Step 8889: {'lr': 0.0004973325346974493, 'samples': 1706688, 'steps': 8888, 'loss/train': 1.372741937637329} +11/06/2021 22:29:13 - INFO - __main__ - Step 8890: {'lr': 0.0004973317614966726, 'samples': 1706880, 'steps': 8889, 'loss/train': 2.034008502960205} +11/06/2021 22:29:13 - INFO - __main__ - Step 8891: {'lr': 0.000497330988184452, 'samples': 1707072, 'steps': 8890, 'loss/train': 1.9604440927505493} +11/06/2021 22:29:13 - INFO - __main__ - Step 8892: {'lr': 0.000497330214760788, 'samples': 1707264, 'steps': 8891, 'loss/train': 0.9298360347747803} +11/06/2021 22:29:14 - INFO - __main__ - Step 8893: {'lr': 0.0004973294412256807, 'samples': 1707456, 'steps': 8892, 'loss/train': 1.6712414026260376} +11/06/2021 22:29:14 - INFO - __main__ - Step 8894: {'lr': 0.0004973286675791305, 'samples': 1707648, 'steps': 8893, 'loss/train': 1.9249519109725952} +11/06/2021 22:29:15 - INFO - __main__ - Step 8895: {'lr': 0.000497327893821138, 'samples': 1707840, 'steps': 8894, 'loss/train': 1.5401326417922974} +11/06/2021 22:29:15 - INFO - __main__ - Step 8896: {'lr': 0.0004973271199517033, 'samples': 1708032, 'steps': 8895, 'loss/train': 1.5258654356002808} +11/06/2021 22:29:16 - INFO - __main__ - Step 8897: {'lr': 0.0004973263459708268, 'samples': 1708224, 'steps': 8896, 'loss/train': 1.3488224744796753} +11/06/2021 22:29:16 - INFO - __main__ - Step 8898: {'lr': 0.0004973255718785088, 'samples': 1708416, 'steps': 8897, 'loss/train': 1.7817871570587158} +11/06/2021 22:29:16 - INFO - __main__ - Step 8899: {'lr': 0.0004973247976747499, 'samples': 1708608, 'steps': 8898, 'loss/train': 1.7609913349151611} +11/06/2021 22:29:17 - INFO - __main__ - Step 8900: {'lr': 0.00049732402335955, 'samples': 1708800, 'steps': 8899, 'loss/train': 1.659672737121582} +11/06/2021 22:29:18 - INFO - __main__ - Step 8901: {'lr': 0.0004973232489329099, 'samples': 1708992, 'steps': 8900, 'loss/train': 1.438830852508545} +11/06/2021 22:29:18 - INFO - __main__ - Step 8902: {'lr': 0.0004973224743948298, 'samples': 1709184, 'steps': 8901, 'loss/train': 2.05006742477417} +11/06/2021 22:29:18 - INFO - __main__ - Step 8903: {'lr': 0.00049732169974531, 'samples': 1709376, 'steps': 8902, 'loss/train': 1.8295646905899048} +11/06/2021 22:29:19 - INFO - __main__ - Step 8904: {'lr': 0.0004973209249843507, 'samples': 1709568, 'steps': 8903, 'loss/train': 1.4633625745773315} +11/06/2021 22:29:19 - INFO - __main__ - Step 8905: {'lr': 0.0004973201501119525, 'samples': 1709760, 'steps': 8904, 'loss/train': 1.7192811965942383} +11/06/2021 22:29:20 - INFO - __main__ - Step 8906: {'lr': 0.0004973193751281156, 'samples': 1709952, 'steps': 8905, 'loss/train': 1.834681510925293} +11/06/2021 22:29:20 - INFO - __main__ - Step 8907: {'lr': 0.0004973186000328405, 'samples': 1710144, 'steps': 8906, 'loss/train': 1.5164721012115479} +11/06/2021 22:29:21 - INFO - __main__ - Step 8908: {'lr': 0.0004973178248261274, 'samples': 1710336, 'steps': 8907, 'loss/train': 2.1482808589935303} +11/06/2021 22:29:21 - INFO - __main__ - Step 8909: {'lr': 0.0004973170495079768, 'samples': 1710528, 'steps': 8908, 'loss/train': 2.774986505508423} +11/06/2021 22:29:22 - INFO - __main__ - Step 8910: {'lr': 0.0004973162740783888, 'samples': 1710720, 'steps': 8909, 'loss/train': 1.804287075996399} +11/06/2021 22:29:23 - INFO - __main__ - Step 8911: {'lr': 0.000497315498537364, 'samples': 1710912, 'steps': 8910, 'loss/train': 1.4533205032348633} +11/06/2021 22:29:23 - INFO - __main__ - Step 8912: {'lr': 0.0004973147228849027, 'samples': 1711104, 'steps': 8911, 'loss/train': 1.924820065498352} +11/06/2021 22:29:23 - INFO - __main__ - Step 8913: {'lr': 0.0004973139471210051, 'samples': 1711296, 'steps': 8912, 'loss/train': 1.9860786199569702} +11/06/2021 22:29:24 - INFO - __main__ - Step 8914: {'lr': 0.0004973131712456717, 'samples': 1711488, 'steps': 8913, 'loss/train': 1.800611972808838} +11/06/2021 22:29:24 - INFO - __main__ - Step 8915: {'lr': 0.0004973123952589027, 'samples': 1711680, 'steps': 8914, 'loss/train': 2.1335561275482178} +11/06/2021 22:29:25 - INFO - __main__ - Step 8916: {'lr': 0.0004973116191606987, 'samples': 1711872, 'steps': 8915, 'loss/train': 2.246720552444458} +11/06/2021 22:29:25 - INFO - __main__ - Step 8917: {'lr': 0.0004973108429510598, 'samples': 1712064, 'steps': 8916, 'loss/train': 1.5170209407806396} +11/06/2021 22:29:26 - INFO - __main__ - Step 8918: {'lr': 0.0004973100666299864, 'samples': 1712256, 'steps': 8917, 'loss/train': 1.8479684591293335} +11/06/2021 22:29:26 - INFO - __main__ - Step 8919: {'lr': 0.000497309290197479, 'samples': 1712448, 'steps': 8918, 'loss/train': 1.6200121641159058} +11/06/2021 22:29:27 - INFO - __main__ - Step 8920: {'lr': 0.0004973085136535379, 'samples': 1712640, 'steps': 8919, 'loss/train': 1.8492422103881836} +11/06/2021 22:29:27 - INFO - __main__ - Step 8921: {'lr': 0.0004973077369981633, 'samples': 1712832, 'steps': 8920, 'loss/train': 1.80856192111969} +11/06/2021 22:29:28 - INFO - __main__ - Step 8922: {'lr': 0.0004973069602313557, 'samples': 1713024, 'steps': 8921, 'loss/train': 2.0224783420562744} +11/06/2021 22:29:28 - INFO - __main__ - Step 8923: {'lr': 0.0004973061833531154, 'samples': 1713216, 'steps': 8922, 'loss/train': 1.5250040292739868} +11/06/2021 22:29:28 - INFO - __main__ - Step 8924: {'lr': 0.0004973054063634428, 'samples': 1713408, 'steps': 8923, 'loss/train': 1.9554498195648193} +11/06/2021 22:29:29 - INFO - __main__ - Step 8925: {'lr': 0.0004973046292623382, 'samples': 1713600, 'steps': 8924, 'loss/train': 1.6448603868484497} +11/06/2021 22:29:30 - INFO - __main__ - Step 8926: {'lr': 0.0004973038520498017, 'samples': 1713792, 'steps': 8925, 'loss/train': 1.983763575553894} +11/06/2021 22:29:30 - INFO - __main__ - Step 8927: {'lr': 0.0004973030747258342, 'samples': 1713984, 'steps': 8926, 'loss/train': 1.5370417833328247} +11/06/2021 22:29:31 - INFO - __main__ - Step 8928: {'lr': 0.0004973022972904356, 'samples': 1714176, 'steps': 8927, 'loss/train': 2.2001898288726807} +11/06/2021 22:29:31 - INFO - __main__ - Step 8929: {'lr': 0.0004973015197436063, 'samples': 1714368, 'steps': 8928, 'loss/train': 3.589097023010254} +11/06/2021 22:29:31 - INFO - __main__ - Step 8930: {'lr': 0.0004973007420853471, 'samples': 1714560, 'steps': 8929, 'loss/train': 1.7380764484405518} +11/06/2021 22:29:32 - INFO - __main__ - Step 8931: {'lr': 0.0004972999643156577, 'samples': 1714752, 'steps': 8930, 'loss/train': 1.9435979127883911} +11/06/2021 22:29:33 - INFO - __main__ - Step 8932: {'lr': 0.0004972991864345389, 'samples': 1714944, 'steps': 8931, 'loss/train': 1.745599627494812} +11/06/2021 22:29:33 - INFO - __main__ - Step 8933: {'lr': 0.0004972984084419908, 'samples': 1715136, 'steps': 8932, 'loss/train': 1.9273251295089722} +11/06/2021 22:29:34 - INFO - __main__ - Step 8934: {'lr': 0.0004972976303380139, 'samples': 1715328, 'steps': 8933, 'loss/train': 1.3530958890914917} +11/06/2021 22:29:34 - INFO - __main__ - Step 8935: {'lr': 0.0004972968521226085, 'samples': 1715520, 'steps': 8934, 'loss/train': 2.121579885482788} +11/06/2021 22:29:34 - INFO - __main__ - Step 8936: {'lr': 0.0004972960737957749, 'samples': 1715712, 'steps': 8935, 'loss/train': 1.9268077611923218} +11/06/2021 22:29:35 - INFO - __main__ - Step 8937: {'lr': 0.0004972952953575136, 'samples': 1715904, 'steps': 8936, 'loss/train': 1.8524378538131714} +11/06/2021 22:29:36 - INFO - __main__ - Step 8938: {'lr': 0.0004972945168078248, 'samples': 1716096, 'steps': 8937, 'loss/train': 0.22625112533569336} +11/06/2021 22:29:36 - INFO - __main__ - Step 8939: {'lr': 0.000497293738146709, 'samples': 1716288, 'steps': 8938, 'loss/train': 1.5457402467727661} +11/06/2021 22:29:36 - INFO - __main__ - Step 8940: {'lr': 0.0004972929593741662, 'samples': 1716480, 'steps': 8939, 'loss/train': 1.9634605646133423} +11/06/2021 22:29:37 - INFO - __main__ - Step 8941: {'lr': 0.0004972921804901973, 'samples': 1716672, 'steps': 8940, 'loss/train': 1.6684246063232422} +11/06/2021 22:29:38 - INFO - __main__ - Step 8942: {'lr': 0.0004972914014948023, 'samples': 1716864, 'steps': 8941, 'loss/train': 2.112210512161255} +11/06/2021 22:29:38 - INFO - __main__ - Step 8943: {'lr': 0.0004972906223879815, 'samples': 1717056, 'steps': 8942, 'loss/train': 2.020785331726074} +11/06/2021 22:29:39 - INFO - __main__ - Step 8944: {'lr': 0.0004972898431697355, 'samples': 1717248, 'steps': 8943, 'loss/train': 1.4316191673278809} +11/06/2021 22:29:39 - INFO - __main__ - Step 8945: {'lr': 0.0004972890638400644, 'samples': 1717440, 'steps': 8944, 'loss/train': 3.3050966262817383} +11/06/2021 22:29:39 - INFO - __main__ - Step 8946: {'lr': 0.0004972882843989687, 'samples': 1717632, 'steps': 8945, 'loss/train': 1.6966694593429565} +11/06/2021 22:29:40 - INFO - __main__ - Step 8947: {'lr': 0.0004972875048464487, 'samples': 1717824, 'steps': 8946, 'loss/train': 1.5771774053573608} +11/06/2021 22:29:41 - INFO - __main__ - Step 8948: {'lr': 0.0004972867251825048, 'samples': 1718016, 'steps': 8947, 'loss/train': 2.001603841781616} +11/06/2021 22:29:41 - INFO - __main__ - Step 8949: {'lr': 0.0004972859454071373, 'samples': 1718208, 'steps': 8948, 'loss/train': 1.704656720161438} +11/06/2021 22:29:41 - INFO - __main__ - Step 8950: {'lr': 0.0004972851655203465, 'samples': 1718400, 'steps': 8949, 'loss/train': 2.2928240299224854} +11/06/2021 22:29:42 - INFO - __main__ - Step 8951: {'lr': 0.000497284385522133, 'samples': 1718592, 'steps': 8950, 'loss/train': 2.0876405239105225} +11/06/2021 22:29:42 - INFO - __main__ - Step 8952: {'lr': 0.0004972836054124968, 'samples': 1718784, 'steps': 8951, 'loss/train': 1.9462846517562866} +11/06/2021 22:29:43 - INFO - __main__ - Step 8953: {'lr': 0.0004972828251914384, 'samples': 1718976, 'steps': 8952, 'loss/train': 1.3022961616516113} +11/06/2021 22:29:43 - INFO - __main__ - Step 8954: {'lr': 0.0004972820448589584, 'samples': 1719168, 'steps': 8953, 'loss/train': 1.0215758085250854} +11/06/2021 22:29:44 - INFO - __main__ - Step 8955: {'lr': 0.0004972812644150567, 'samples': 1719360, 'steps': 8954, 'loss/train': 1.7224310636520386} +11/06/2021 22:29:44 - INFO - __main__ - Step 8956: {'lr': 0.000497280483859734, 'samples': 1719552, 'steps': 8955, 'loss/train': 1.3424328565597534} +11/06/2021 22:29:45 - INFO - __main__ - Step 8957: {'lr': 0.0004972797031929904, 'samples': 1719744, 'steps': 8956, 'loss/train': 1.9782111644744873} +11/06/2021 22:29:45 - INFO - __main__ - Step 8958: {'lr': 0.0004972789224148266, 'samples': 1719936, 'steps': 8957, 'loss/train': 2.0518736839294434} +11/06/2021 22:29:46 - INFO - __main__ - Step 8959: {'lr': 0.0004972781415252426, 'samples': 1720128, 'steps': 8958, 'loss/train': 2.4421885013580322} +11/06/2021 22:29:46 - INFO - __main__ - Step 8960: {'lr': 0.0004972773605242388, 'samples': 1720320, 'steps': 8959, 'loss/train': 1.4392913579940796} +11/06/2021 22:29:47 - INFO - __main__ - Step 8961: {'lr': 0.0004972765794118158, 'samples': 1720512, 'steps': 8960, 'loss/train': 1.1508708000183105} +11/06/2021 22:29:47 - INFO - __main__ - Step 8962: {'lr': 0.0004972757981879737, 'samples': 1720704, 'steps': 8961, 'loss/train': 1.7767452001571655} +11/06/2021 22:29:48 - INFO - __main__ - Step 8963: {'lr': 0.000497275016852713, 'samples': 1720896, 'steps': 8962, 'loss/train': 2.000983953475952} +11/06/2021 22:29:48 - INFO - __main__ - Step 8964: {'lr': 0.0004972742354060339, 'samples': 1721088, 'steps': 8963, 'loss/train': 1.6095494031906128} +11/06/2021 22:29:49 - INFO - __main__ - Step 8965: {'lr': 0.0004972734538479369, 'samples': 1721280, 'steps': 8964, 'loss/train': 2.106870174407959} +11/06/2021 22:29:49 - INFO - __main__ - Step 8966: {'lr': 0.0004972726721784223, 'samples': 1721472, 'steps': 8965, 'loss/train': 1.3510915040969849} +11/06/2021 22:29:49 - INFO - __main__ - Step 8967: {'lr': 0.0004972718903974904, 'samples': 1721664, 'steps': 8966, 'loss/train': 2.6114096641540527} +11/06/2021 22:29:50 - INFO - __main__ - Step 8968: {'lr': 0.0004972711085051417, 'samples': 1721856, 'steps': 8967, 'loss/train': 1.257983922958374} +11/06/2021 22:29:51 - INFO - __main__ - Step 8969: {'lr': 0.0004972703265013764, 'samples': 1722048, 'steps': 8968, 'loss/train': 1.7631484270095825} +11/06/2021 22:29:51 - INFO - __main__ - Step 8970: {'lr': 0.0004972695443861949, 'samples': 1722240, 'steps': 8969, 'loss/train': 1.826780080795288} +11/06/2021 22:29:51 - INFO - __main__ - Step 8971: {'lr': 0.0004972687621595975, 'samples': 1722432, 'steps': 8970, 'loss/train': 1.8841552734375} +11/06/2021 22:29:52 - INFO - __main__ - Step 8972: {'lr': 0.0004972679798215847, 'samples': 1722624, 'steps': 8971, 'loss/train': 1.433433175086975} +11/06/2021 22:29:53 - INFO - __main__ - Step 8973: {'lr': 0.0004972671973721567, 'samples': 1722816, 'steps': 8972, 'loss/train': 1.9559110403060913} +11/06/2021 22:29:53 - INFO - __main__ - Step 8974: {'lr': 0.000497266414811314, 'samples': 1723008, 'steps': 8973, 'loss/train': 2.148409605026245} +11/06/2021 22:29:54 - INFO - __main__ - Step 8975: {'lr': 0.0004972656321390568, 'samples': 1723200, 'steps': 8974, 'loss/train': 1.603281855583191} +11/06/2021 22:29:54 - INFO - __main__ - Step 8976: {'lr': 0.0004972648493553856, 'samples': 1723392, 'steps': 8975, 'loss/train': 1.3855030536651611} +11/06/2021 22:29:54 - INFO - __main__ - Step 8977: {'lr': 0.0004972640664603006, 'samples': 1723584, 'steps': 8976, 'loss/train': 1.4343771934509277} +11/06/2021 22:29:55 - INFO - __main__ - Step 8978: {'lr': 0.0004972632834538023, 'samples': 1723776, 'steps': 8977, 'loss/train': 1.4176015853881836} +11/06/2021 22:29:56 - INFO - __main__ - Step 8979: {'lr': 0.0004972625003358908, 'samples': 1723968, 'steps': 8978, 'loss/train': 1.4474366903305054} +11/06/2021 22:29:56 - INFO - __main__ - Step 8980: {'lr': 0.0004972617171065668, 'samples': 1724160, 'steps': 8979, 'loss/train': 0.7004616260528564} +11/06/2021 22:29:56 - INFO - __main__ - Step 8981: {'lr': 0.0004972609337658305, 'samples': 1724352, 'steps': 8980, 'loss/train': 1.7616783380508423} +11/06/2021 22:29:57 - INFO - __main__ - Step 8982: {'lr': 0.0004972601503136822, 'samples': 1724544, 'steps': 8981, 'loss/train': 1.6659023761749268} +11/06/2021 22:29:57 - INFO - __main__ - Step 8983: {'lr': 0.0004972593667501222, 'samples': 1724736, 'steps': 8982, 'loss/train': 1.7344557046890259} +11/06/2021 22:29:58 - INFO - __main__ - Step 8984: {'lr': 0.0004972585830751511, 'samples': 1724928, 'steps': 8983, 'loss/train': 1.725408673286438} +11/06/2021 22:29:59 - INFO - __main__ - Step 8985: {'lr': 0.0004972577992887689, 'samples': 1725120, 'steps': 8984, 'loss/train': 1.803905725479126} +11/06/2021 22:29:59 - INFO - __main__ - Step 8986: {'lr': 0.0004972570153909763, 'samples': 1725312, 'steps': 8985, 'loss/train': 2.232513427734375} +11/06/2021 22:29:59 - INFO - __main__ - Step 8987: {'lr': 0.0004972562313817735, 'samples': 1725504, 'steps': 8986, 'loss/train': 0.8127360343933105} +11/06/2021 22:30:00 - INFO - __main__ - Step 8988: {'lr': 0.0004972554472611609, 'samples': 1725696, 'steps': 8987, 'loss/train': 2.031003713607788} +11/06/2021 22:30:01 - INFO - __main__ - Step 8989: {'lr': 0.0004972546630291387, 'samples': 1725888, 'steps': 8988, 'loss/train': 1.9944013357162476} +11/06/2021 22:30:01 - INFO - __main__ - Step 8990: {'lr': 0.0004972538786857073, 'samples': 1726080, 'steps': 8989, 'loss/train': 2.087233781814575} +11/06/2021 22:30:01 - INFO - __main__ - Step 8991: {'lr': 0.0004972530942308673, 'samples': 1726272, 'steps': 8990, 'loss/train': 2.0797486305236816} +11/06/2021 22:30:02 - INFO - __main__ - Step 8992: {'lr': 0.0004972523096646188, 'samples': 1726464, 'steps': 8991, 'loss/train': 1.4353597164154053} +11/06/2021 22:30:02 - INFO - __main__ - Step 8993: {'lr': 0.0004972515249869622, 'samples': 1726656, 'steps': 8992, 'loss/train': 1.706042766571045} +11/06/2021 22:30:03 - INFO - __main__ - Step 8994: {'lr': 0.000497250740197898, 'samples': 1726848, 'steps': 8993, 'loss/train': 1.5139485597610474} +11/06/2021 22:30:04 - INFO - __main__ - Step 8995: {'lr': 0.0004972499552974263, 'samples': 1727040, 'steps': 8994, 'loss/train': 1.8484820127487183} +11/06/2021 22:30:04 - INFO - __main__ - Step 8996: {'lr': 0.0004972491702855477, 'samples': 1727232, 'steps': 8995, 'loss/train': 1.559495210647583} +11/06/2021 22:30:04 - INFO - __main__ - Step 8997: {'lr': 0.0004972483851622623, 'samples': 1727424, 'steps': 8996, 'loss/train': 2.627495527267456} +11/06/2021 22:30:05 - INFO - __main__ - Step 8998: {'lr': 0.0004972475999275707, 'samples': 1727616, 'steps': 8997, 'loss/train': 1.676787257194519} +11/06/2021 22:30:06 - INFO - __main__ - Step 8999: {'lr': 0.0004972468145814729, 'samples': 1727808, 'steps': 8998, 'loss/train': 1.9144270420074463} +11/06/2021 22:30:06 - INFO - __main__ - Step 9000: {'lr': 0.0004972460291239697, 'samples': 1728000, 'steps': 8999, 'loss/train': 2.2997002601623535} +11/06/2021 22:30:06 - INFO - __main__ - Step 9001: {'lr': 0.0004972452435550613, 'samples': 1728192, 'steps': 9000, 'loss/train': 1.8456697463989258} +11/06/2021 22:30:07 - INFO - __main__ - Step 9002: {'lr': 0.000497244457874748, 'samples': 1728384, 'steps': 9001, 'loss/train': 1.736275315284729} +11/06/2021 22:30:07 - INFO - __main__ - Step 9003: {'lr': 0.0004972436720830301, 'samples': 1728576, 'steps': 9002, 'loss/train': 1.504355549812317} +11/06/2021 22:30:08 - INFO - __main__ - Step 9004: {'lr': 0.000497242886179908, 'samples': 1728768, 'steps': 9003, 'loss/train': 1.5996493101119995} +11/06/2021 22:30:08 - INFO - __main__ - Step 9005: {'lr': 0.0004972421001653822, 'samples': 1728960, 'steps': 9004, 'loss/train': 1.5102970600128174} +11/06/2021 22:30:09 - INFO - __main__ - Step 9006: {'lr': 0.0004972413140394528, 'samples': 1729152, 'steps': 9005, 'loss/train': 2.118058204650879} +11/06/2021 22:30:09 - INFO - __main__ - Step 9007: {'lr': 0.0004972405278021203, 'samples': 1729344, 'steps': 9006, 'loss/train': 2.190336227416992} +11/06/2021 22:30:09 - INFO - __main__ - Step 9008: {'lr': 0.000497239741453385, 'samples': 1729536, 'steps': 9007, 'loss/train': 1.8450963497161865} +11/06/2021 22:30:10 - INFO - __main__ - Step 9009: {'lr': 0.0004972389549932473, 'samples': 1729728, 'steps': 9008, 'loss/train': 2.0399389266967773} +11/06/2021 22:30:11 - INFO - __main__ - Step 9010: {'lr': 0.0004972381684217077, 'samples': 1729920, 'steps': 9009, 'loss/train': 1.8316234350204468} +11/06/2021 22:30:11 - INFO - __main__ - Step 9011: {'lr': 0.0004972373817387662, 'samples': 1730112, 'steps': 9010, 'loss/train': 0.9349846839904785} +11/06/2021 22:30:11 - INFO - __main__ - Step 9012: {'lr': 0.0004972365949444234, 'samples': 1730304, 'steps': 9011, 'loss/train': 1.6661643981933594} +11/06/2021 22:30:12 - INFO - __main__ - Step 9013: {'lr': 0.0004972358080386796, 'samples': 1730496, 'steps': 9012, 'loss/train': 1.3828058242797852} +11/06/2021 22:30:12 - INFO - __main__ - Step 9014: {'lr': 0.0004972350210215353, 'samples': 1730688, 'steps': 9013, 'loss/train': 1.3896691799163818} +11/06/2021 22:30:13 - INFO - __main__ - Step 9015: {'lr': 0.0004972342338929906, 'samples': 1730880, 'steps': 9014, 'loss/train': 1.6471271514892578} +11/06/2021 22:30:13 - INFO - __main__ - Step 9016: {'lr': 0.000497233446653046, 'samples': 1731072, 'steps': 9015, 'loss/train': 1.893143892288208} +11/06/2021 22:30:14 - INFO - __main__ - Step 9017: {'lr': 0.0004972326593017017, 'samples': 1731264, 'steps': 9016, 'loss/train': 1.5417567491531372} +11/06/2021 22:30:14 - INFO - __main__ - Step 9018: {'lr': 0.0004972318718389583, 'samples': 1731456, 'steps': 9017, 'loss/train': 2.1753854751586914} +11/06/2021 22:30:14 - INFO - __main__ - Step 9019: {'lr': 0.000497231084264816, 'samples': 1731648, 'steps': 9018, 'loss/train': 1.7801073789596558} +11/06/2021 22:30:16 - INFO - __main__ - Step 9020: {'lr': 0.0004972302965792752, 'samples': 1731840, 'steps': 9019, 'loss/train': 1.927689790725708} +11/06/2021 22:30:16 - INFO - __main__ - Step 9021: {'lr': 0.0004972295087823362, 'samples': 1732032, 'steps': 9020, 'loss/train': 1.54207444190979} +11/06/2021 22:30:16 - INFO - __main__ - Step 9022: {'lr': 0.0004972287208739995, 'samples': 1732224, 'steps': 9021, 'loss/train': 1.5854400396347046} +11/06/2021 22:30:17 - INFO - __main__ - Step 9023: {'lr': 0.0004972279328542652, 'samples': 1732416, 'steps': 9022, 'loss/train': 2.2019128799438477} +11/06/2021 22:30:17 - INFO - __main__ - Step 9024: {'lr': 0.000497227144723134, 'samples': 1732608, 'steps': 9023, 'loss/train': 1.814888596534729} +11/06/2021 22:30:18 - INFO - __main__ - Step 9025: {'lr': 0.0004972263564806059, 'samples': 1732800, 'steps': 9024, 'loss/train': 2.2460262775421143} +11/06/2021 22:30:18 - INFO - __main__ - Step 9026: {'lr': 0.0004972255681266816, 'samples': 1732992, 'steps': 9025, 'loss/train': 2.0175039768218994} +11/06/2021 22:30:19 - INFO - __main__ - Step 9027: {'lr': 0.0004972247796613611, 'samples': 1733184, 'steps': 9026, 'loss/train': 1.2223052978515625} +11/06/2021 22:30:19 - INFO - __main__ - Step 9028: {'lr': 0.000497223991084645, 'samples': 1733376, 'steps': 9027, 'loss/train': 1.550275206565857} +11/06/2021 22:30:19 - INFO - __main__ - Step 9029: {'lr': 0.0004972232023965335, 'samples': 1733568, 'steps': 9028, 'loss/train': 1.8038307428359985} +11/06/2021 22:30:20 - INFO - __main__ - Step 9030: {'lr': 0.0004972224135970271, 'samples': 1733760, 'steps': 9029, 'loss/train': 1.7093403339385986} +11/06/2021 22:30:21 - INFO - __main__ - Step 9031: {'lr': 0.0004972216246861262, 'samples': 1733952, 'steps': 9030, 'loss/train': 2.1160690784454346} +11/06/2021 22:30:21 - INFO - __main__ - Step 9032: {'lr': 0.0004972208356638309, 'samples': 1734144, 'steps': 9031, 'loss/train': 0.9576528072357178} +11/06/2021 22:30:21 - INFO - __main__ - Step 9033: {'lr': 0.0004972200465301418, 'samples': 1734336, 'steps': 9032, 'loss/train': 2.587282657623291} +11/06/2021 22:30:22 - INFO - __main__ - Step 9034: {'lr': 0.0004972192572850592, 'samples': 1734528, 'steps': 9033, 'loss/train': 1.5511127710342407} +11/06/2021 22:30:22 - INFO - __main__ - Step 9035: {'lr': 0.0004972184679285833, 'samples': 1734720, 'steps': 9034, 'loss/train': 1.6166201829910278} +11/06/2021 22:30:23 - INFO - __main__ - Step 9036: {'lr': 0.0004972176784607146, 'samples': 1734912, 'steps': 9035, 'loss/train': 1.4050244092941284} +11/06/2021 22:30:24 - INFO - __main__ - Step 9037: {'lr': 0.0004972168888814533, 'samples': 1735104, 'steps': 9036, 'loss/train': 2.019019842147827} +11/06/2021 22:30:24 - INFO - __main__ - Step 9038: {'lr': 0.0004972160991908001, 'samples': 1735296, 'steps': 9037, 'loss/train': 1.9093737602233887} +11/06/2021 22:30:24 - INFO - __main__ - Step 9039: {'lr': 0.0004972153093887551, 'samples': 1735488, 'steps': 9038, 'loss/train': 1.671932578086853} +11/06/2021 22:30:25 - INFO - __main__ - Step 9040: {'lr': 0.0004972145194753186, 'samples': 1735680, 'steps': 9039, 'loss/train': 1.3389232158660889} +11/06/2021 22:30:26 - INFO - __main__ - Step 9041: {'lr': 0.0004972137294504912, 'samples': 1735872, 'steps': 9040, 'loss/train': 2.4330387115478516} +11/06/2021 22:30:26 - INFO - __main__ - Step 9042: {'lr': 0.000497212939314273, 'samples': 1736064, 'steps': 9041, 'loss/train': 1.3045024871826172} +11/06/2021 22:30:26 - INFO - __main__ - Step 9043: {'lr': 0.0004972121490666644, 'samples': 1736256, 'steps': 9042, 'loss/train': 1.6939752101898193} +11/06/2021 22:30:27 - INFO - __main__ - Step 9044: {'lr': 0.000497211358707666, 'samples': 1736448, 'steps': 9043, 'loss/train': 1.862133502960205} +11/06/2021 22:30:27 - INFO - __main__ - Step 9045: {'lr': 0.0004972105682372779, 'samples': 1736640, 'steps': 9044, 'loss/train': 2.044528007507324} +11/06/2021 22:30:29 - INFO - __main__ - Step 9046: {'lr': 0.0004972097776555005, 'samples': 1736832, 'steps': 9045, 'loss/train': 1.8090245723724365} +11/06/2021 22:30:29 - INFO - __main__ - Step 9047: {'lr': 0.0004972089869623342, 'samples': 1737024, 'steps': 9046, 'loss/train': 1.5942614078521729} +11/06/2021 22:30:29 - INFO - __main__ - Step 9048: {'lr': 0.0004972081961577793, 'samples': 1737216, 'steps': 9047, 'loss/train': 2.0264124870300293} +11/06/2021 22:30:30 - INFO - __main__ - Step 9049: {'lr': 0.0004972074052418363, 'samples': 1737408, 'steps': 9048, 'loss/train': 1.723054051399231} +11/06/2021 22:30:30 - INFO - __main__ - Step 9050: {'lr': 0.0004972066142145055, 'samples': 1737600, 'steps': 9049, 'loss/train': 1.216286540031433} +11/06/2021 22:30:30 - INFO - __main__ - Step 9051: {'lr': 0.0004972058230757871, 'samples': 1737792, 'steps': 9050, 'loss/train': 1.870058536529541} +11/06/2021 22:30:31 - INFO - __main__ - Step 9052: {'lr': 0.0004972050318256815, 'samples': 1737984, 'steps': 9051, 'loss/train': 0.3041784465312958} +11/06/2021 22:30:32 - INFO - __main__ - Step 9053: {'lr': 0.0004972042404641893, 'samples': 1738176, 'steps': 9052, 'loss/train': 1.6829752922058105} +11/06/2021 22:30:32 - INFO - __main__ - Step 9054: {'lr': 0.0004972034489913106, 'samples': 1738368, 'steps': 9053, 'loss/train': 1.7771741151809692} +11/06/2021 22:30:32 - INFO - __main__ - Step 9055: {'lr': 0.0004972026574070459, 'samples': 1738560, 'steps': 9054, 'loss/train': 2.233604907989502} +11/06/2021 22:30:33 - INFO - __main__ - Step 9056: {'lr': 0.0004972018657113953, 'samples': 1738752, 'steps': 9055, 'loss/train': 2.35441517829895} +11/06/2021 22:30:34 - INFO - __main__ - Step 9057: {'lr': 0.0004972010739043596, 'samples': 1738944, 'steps': 9056, 'loss/train': 1.8315443992614746} +11/06/2021 22:30:34 - INFO - __main__ - Step 9058: {'lr': 0.0004972002819859388, 'samples': 1739136, 'steps': 9057, 'loss/train': 1.4996757507324219} +11/06/2021 22:30:34 - INFO - __main__ - Step 9059: {'lr': 0.0004971994899561334, 'samples': 1739328, 'steps': 9058, 'loss/train': 2.07483172416687} +11/06/2021 22:30:35 - INFO - __main__ - Step 9060: {'lr': 0.0004971986978149437, 'samples': 1739520, 'steps': 9059, 'loss/train': 1.568691372871399} +11/06/2021 22:30:35 - INFO - __main__ - Step 9061: {'lr': 0.0004971979055623701, 'samples': 1739712, 'steps': 9060, 'loss/train': 1.295201063156128} +11/06/2021 22:30:36 - INFO - __main__ - Step 9062: {'lr': 0.0004971971131984129, 'samples': 1739904, 'steps': 9061, 'loss/train': 2.6647539138793945} +11/06/2021 22:30:37 - INFO - __main__ - Step 9063: {'lr': 0.0004971963207230725, 'samples': 1740096, 'steps': 9062, 'loss/train': 1.6942551136016846} +11/06/2021 22:30:37 - INFO - __main__ - Step 9064: {'lr': 0.0004971955281363493, 'samples': 1740288, 'steps': 9063, 'loss/train': 1.9272085428237915} +11/06/2021 22:30:37 - INFO - __main__ - Step 9065: {'lr': 0.0004971947354382436, 'samples': 1740480, 'steps': 9064, 'loss/train': 1.482258677482605} +11/06/2021 22:30:38 - INFO - __main__ - Step 9066: {'lr': 0.0004971939426287557, 'samples': 1740672, 'steps': 9065, 'loss/train': 2.1765670776367188} +11/06/2021 22:30:39 - INFO - __main__ - Step 9067: {'lr': 0.0004971931497078861, 'samples': 1740864, 'steps': 9066, 'loss/train': 1.9422248601913452} +11/06/2021 22:30:39 - INFO - __main__ - Step 9068: {'lr': 0.000497192356675635, 'samples': 1741056, 'steps': 9067, 'loss/train': 0.8091076612472534} +11/06/2021 22:30:39 - INFO - __main__ - Step 9069: {'lr': 0.0004971915635320029, 'samples': 1741248, 'steps': 9068, 'loss/train': 2.0615551471710205} +11/06/2021 22:30:40 - INFO - __main__ - Step 9070: {'lr': 0.0004971907702769901, 'samples': 1741440, 'steps': 9069, 'loss/train': 1.8505113124847412} +11/06/2021 22:30:40 - INFO - __main__ - Step 9071: {'lr': 0.000497189976910597, 'samples': 1741632, 'steps': 9070, 'loss/train': 2.2380783557891846} +11/06/2021 22:30:41 - INFO - __main__ - Step 9072: {'lr': 0.0004971891834328238, 'samples': 1741824, 'steps': 9071, 'loss/train': 0.3026748597621918} +11/06/2021 22:30:41 - INFO - __main__ - Step 9073: {'lr': 0.000497188389843671, 'samples': 1742016, 'steps': 9072, 'loss/train': 1.1784673929214478} +11/06/2021 22:30:42 - INFO - __main__ - Step 9074: {'lr': 0.0004971875961431389, 'samples': 1742208, 'steps': 9073, 'loss/train': 1.7177537679672241} +11/06/2021 22:30:42 - INFO - __main__ - Step 9075: {'lr': 0.000497186802331228, 'samples': 1742400, 'steps': 9074, 'loss/train': 2.291787624359131} +11/06/2021 22:30:43 - INFO - __main__ - Step 9076: {'lr': 0.0004971860084079385, 'samples': 1742592, 'steps': 9075, 'loss/train': 1.1271553039550781} +11/06/2021 22:30:43 - INFO - __main__ - Step 9077: {'lr': 0.0004971852143732707, 'samples': 1742784, 'steps': 9076, 'loss/train': 1.6700618267059326} +11/06/2021 22:30:44 - INFO - __main__ - Step 9078: {'lr': 0.0004971844202272251, 'samples': 1742976, 'steps': 9077, 'loss/train': 1.7252506017684937} +11/06/2021 22:30:44 - INFO - __main__ - Step 9079: {'lr': 0.000497183625969802, 'samples': 1743168, 'steps': 9078, 'loss/train': 1.921452283859253} +11/06/2021 22:30:45 - INFO - __main__ - Step 9080: {'lr': 0.0004971828316010019, 'samples': 1743360, 'steps': 9079, 'loss/train': 1.8389270305633545} +11/06/2021 22:30:45 - INFO - __main__ - Step 9081: {'lr': 0.0004971820371208248, 'samples': 1743552, 'steps': 9080, 'loss/train': 1.7379286289215088} +11/06/2021 22:30:45 - INFO - __main__ - Step 9082: {'lr': 0.0004971812425292716, 'samples': 1743744, 'steps': 9081, 'loss/train': 2.1627986431121826} +11/06/2021 22:30:46 - INFO - __main__ - Step 9083: {'lr': 0.000497180447826342, 'samples': 1743936, 'steps': 9082, 'loss/train': 1.5003117322921753} +11/06/2021 22:30:47 - INFO - __main__ - Step 9084: {'lr': 0.0004971796530120371, 'samples': 1744128, 'steps': 9083, 'loss/train': 1.885785460472107} +11/06/2021 22:30:47 - INFO - __main__ - Step 9085: {'lr': 0.0004971788580863566, 'samples': 1744320, 'steps': 9084, 'loss/train': 1.6980434656143188} +11/06/2021 22:30:47 - INFO - __main__ - Step 9086: {'lr': 0.0004971780630493012, 'samples': 1744512, 'steps': 9085, 'loss/train': 1.8362492322921753} +11/06/2021 22:30:48 - INFO - __main__ - Step 9087: {'lr': 0.000497177267900871, 'samples': 1744704, 'steps': 9086, 'loss/train': 1.9315646886825562} +11/06/2021 22:30:49 - INFO - __main__ - Step 9088: {'lr': 0.0004971764726410668, 'samples': 1744896, 'steps': 9087, 'loss/train': 1.8160526752471924} +11/06/2021 22:30:49 - INFO - __main__ - Step 9089: {'lr': 0.0004971756772698886, 'samples': 1745088, 'steps': 9088, 'loss/train': 1.7330033779144287} +11/06/2021 22:30:50 - INFO - __main__ - Step 9090: {'lr': 0.0004971748817873367, 'samples': 1745280, 'steps': 9089, 'loss/train': 1.8694642782211304} +11/06/2021 22:30:50 - INFO - __main__ - Step 9091: {'lr': 0.0004971740861934117, 'samples': 1745472, 'steps': 9090, 'loss/train': 1.788362741470337} +11/06/2021 22:30:50 - INFO - __main__ - Step 9092: {'lr': 0.000497173290488114, 'samples': 1745664, 'steps': 9091, 'loss/train': 1.6177334785461426} +11/06/2021 22:30:52 - INFO - __main__ - Step 9093: {'lr': 0.0004971724946714437, 'samples': 1745856, 'steps': 9092, 'loss/train': 1.626973032951355} +11/06/2021 22:30:52 - INFO - __main__ - Step 9094: {'lr': 0.0004971716987434014, 'samples': 1746048, 'steps': 9093, 'loss/train': 1.3091498613357544} +11/06/2021 22:30:52 - INFO - __main__ - Step 9095: {'lr': 0.0004971709027039872, 'samples': 1746240, 'steps': 9094, 'loss/train': 1.3420382738113403} +11/06/2021 22:30:53 - INFO - __main__ - Step 9096: {'lr': 0.0004971701065532017, 'samples': 1746432, 'steps': 9095, 'loss/train': 1.4940237998962402} +11/06/2021 22:30:53 - INFO - __main__ - Step 9097: {'lr': 0.0004971693102910451, 'samples': 1746624, 'steps': 9096, 'loss/train': 2.1180343627929688} +11/06/2021 22:30:53 - INFO - __main__ - Step 9098: {'lr': 0.0004971685139175179, 'samples': 1746816, 'steps': 9097, 'loss/train': 2.4166030883789062} +11/06/2021 22:30:54 - INFO - __main__ - Step 9099: {'lr': 0.0004971677174326204, 'samples': 1747008, 'steps': 9098, 'loss/train': 5.840542316436768} +11/06/2021 22:30:55 - INFO - __main__ - Step 9100: {'lr': 0.0004971669208363529, 'samples': 1747200, 'steps': 9099, 'loss/train': 5.970412731170654} +11/06/2021 22:30:55 - INFO - __main__ - Step 9101: {'lr': 0.0004971661241287157, 'samples': 1747392, 'steps': 9100, 'loss/train': 2.0452849864959717} +11/06/2021 22:30:55 - INFO - __main__ - Step 9102: {'lr': 0.0004971653273097094, 'samples': 1747584, 'steps': 9101, 'loss/train': 1.074893593788147} +11/06/2021 22:30:56 - INFO - __main__ - Step 9103: {'lr': 0.0004971645303793342, 'samples': 1747776, 'steps': 9102, 'loss/train': 1.511845588684082} +11/06/2021 22:30:56 - INFO - __main__ - Step 9104: {'lr': 0.0004971637333375904, 'samples': 1747968, 'steps': 9103, 'loss/train': 1.4513171911239624} +11/06/2021 22:30:57 - INFO - __main__ - Step 9105: {'lr': 0.0004971629361844785, 'samples': 1748160, 'steps': 9104, 'loss/train': 1.3599135875701904} +11/06/2021 22:30:58 - INFO - __main__ - Step 9106: {'lr': 0.0004971621389199988, 'samples': 1748352, 'steps': 9105, 'loss/train': 1.6643626689910889} +11/06/2021 22:30:58 - INFO - __main__ - Step 9107: {'lr': 0.0004971613415441516, 'samples': 1748544, 'steps': 9106, 'loss/train': 1.0446491241455078} +11/06/2021 22:30:58 - INFO - __main__ - Step 9108: {'lr': 0.0004971605440569374, 'samples': 1748736, 'steps': 9107, 'loss/train': 1.783698558807373} +11/06/2021 22:30:59 - INFO - __main__ - Step 9109: {'lr': 0.0004971597464583563, 'samples': 1748928, 'steps': 9108, 'loss/train': 1.7281625270843506} +11/06/2021 22:31:00 - INFO - __main__ - Step 9110: {'lr': 0.0004971589487484091, 'samples': 1749120, 'steps': 9109, 'loss/train': 1.642425537109375} +11/06/2021 22:31:00 - INFO - __main__ - Step 9111: {'lr': 0.0004971581509270956, 'samples': 1749312, 'steps': 9110, 'loss/train': 1.2902659177780151} +11/06/2021 22:31:01 - INFO - __main__ - Step 9112: {'lr': 0.0004971573529944167, 'samples': 1749504, 'steps': 9111, 'loss/train': 2.028707981109619} +11/06/2021 22:31:01 - INFO - __main__ - Step 9113: {'lr': 0.0004971565549503723, 'samples': 1749696, 'steps': 9112, 'loss/train': 2.295679807662964} +11/06/2021 22:31:01 - INFO - __main__ - Step 9114: {'lr': 0.0004971557567949631, 'samples': 1749888, 'steps': 9113, 'loss/train': 1.6835025548934937} +11/06/2021 22:31:02 - INFO - __main__ - Step 9115: {'lr': 0.0004971549585281893, 'samples': 1750080, 'steps': 9114, 'loss/train': 1.3464192152023315} +11/06/2021 22:31:03 - INFO - __main__ - Step 9116: {'lr': 0.0004971541601500513, 'samples': 1750272, 'steps': 9115, 'loss/train': 1.7078288793563843} +11/06/2021 22:31:03 - INFO - __main__ - Step 9117: {'lr': 0.0004971533616605495, 'samples': 1750464, 'steps': 9116, 'loss/train': 1.4062687158584595} +11/06/2021 22:31:03 - INFO - __main__ - Step 9118: {'lr': 0.0004971525630596841, 'samples': 1750656, 'steps': 9117, 'loss/train': 1.889479637145996} +11/06/2021 22:31:04 - INFO - __main__ - Step 9119: {'lr': 0.0004971517643474556, 'samples': 1750848, 'steps': 9118, 'loss/train': 2.2042081356048584} +11/06/2021 22:31:04 - INFO - __main__ - Step 9120: {'lr': 0.0004971509655238643, 'samples': 1751040, 'steps': 9119, 'loss/train': 1.9173781871795654} +11/06/2021 22:31:05 - INFO - __main__ - Step 9121: {'lr': 0.0004971501665889107, 'samples': 1751232, 'steps': 9120, 'loss/train': 1.5485329627990723} +11/06/2021 22:31:05 - INFO - __main__ - Step 9122: {'lr': 0.000497149367542595, 'samples': 1751424, 'steps': 9121, 'loss/train': 2.2474119663238525} +11/06/2021 22:31:06 - INFO - __main__ - Step 9123: {'lr': 0.0004971485683849176, 'samples': 1751616, 'steps': 9122, 'loss/train': 1.9738703966140747} +11/06/2021 22:31:06 - INFO - __main__ - Step 9124: {'lr': 0.0004971477691158788, 'samples': 1751808, 'steps': 9123, 'loss/train': 1.9322994947433472} +11/06/2021 22:31:06 - INFO - __main__ - Step 9125: {'lr': 0.0004971469697354792, 'samples': 1752000, 'steps': 9124, 'loss/train': 2.1170740127563477} +11/06/2021 22:31:08 - INFO - __main__ - Step 9126: {'lr': 0.0004971461702437188, 'samples': 1752192, 'steps': 9125, 'loss/train': 1.9848999977111816} +11/06/2021 22:31:08 - INFO - __main__ - Step 9127: {'lr': 0.0004971453706405981, 'samples': 1752384, 'steps': 9126, 'loss/train': 1.6258814334869385} +11/06/2021 22:31:08 - INFO - __main__ - Step 9128: {'lr': 0.0004971445709261177, 'samples': 1752576, 'steps': 9127, 'loss/train': 1.3074932098388672} +11/06/2021 22:31:09 - INFO - __main__ - Step 9129: {'lr': 0.0004971437711002777, 'samples': 1752768, 'steps': 9128, 'loss/train': 1.880787968635559} +11/06/2021 22:31:09 - INFO - __main__ - Step 9130: {'lr': 0.0004971429711630786, 'samples': 1752960, 'steps': 9129, 'loss/train': 1.60108482837677} +11/06/2021 22:31:10 - INFO - __main__ - Step 9131: {'lr': 0.0004971421711145207, 'samples': 1753152, 'steps': 9130, 'loss/train': 1.9594632387161255} +11/06/2021 22:31:10 - INFO - __main__ - Step 9132: {'lr': 0.0004971413709546043, 'samples': 1753344, 'steps': 9131, 'loss/train': 1.4151302576065063} +11/06/2021 22:31:11 - INFO - __main__ - Step 9133: {'lr': 0.0004971405706833297, 'samples': 1753536, 'steps': 9132, 'loss/train': 2.054569721221924} +11/06/2021 22:31:11 - INFO - __main__ - Step 9134: {'lr': 0.0004971397703006974, 'samples': 1753728, 'steps': 9133, 'loss/train': 2.073517322540283} +11/06/2021 22:31:11 - INFO - __main__ - Step 9135: {'lr': 0.0004971389698067079, 'samples': 1753920, 'steps': 9134, 'loss/train': 2.4211151599884033} +11/06/2021 22:31:12 - INFO - __main__ - Step 9136: {'lr': 0.0004971381692013612, 'samples': 1754112, 'steps': 9135, 'loss/train': 1.4416491985321045} +11/06/2021 22:31:13 - INFO - __main__ - Step 9137: {'lr': 0.000497137368484658, 'samples': 1754304, 'steps': 9136, 'loss/train': 1.7312275171279907} +11/06/2021 22:31:13 - INFO - __main__ - Step 9138: {'lr': 0.0004971365676565984, 'samples': 1754496, 'steps': 9137, 'loss/train': 1.9141130447387695} +11/06/2021 22:31:13 - INFO - __main__ - Step 9139: {'lr': 0.000497135766717183, 'samples': 1754688, 'steps': 9138, 'loss/train': 1.8034145832061768} +11/06/2021 22:31:14 - INFO - __main__ - Step 9140: {'lr': 0.000497134965666412, 'samples': 1754880, 'steps': 9139, 'loss/train': 1.8870742321014404} +11/06/2021 22:31:14 - INFO - __main__ - Step 9141: {'lr': 0.0004971341645042857, 'samples': 1755072, 'steps': 9140, 'loss/train': 1.999513030052185} +11/06/2021 22:31:15 - INFO - __main__ - Step 9142: {'lr': 0.0004971333632308047, 'samples': 1755264, 'steps': 9141, 'loss/train': 2.0353739261627197} +11/06/2021 22:31:15 - INFO - __main__ - Step 9143: {'lr': 0.0004971325618459691, 'samples': 1755456, 'steps': 9142, 'loss/train': 2.1731367111206055} +11/06/2021 22:31:16 - INFO - __main__ - Step 9144: {'lr': 0.0004971317603497795, 'samples': 1755648, 'steps': 9143, 'loss/train': 1.4460906982421875} +11/06/2021 22:31:16 - INFO - __main__ - Step 9145: {'lr': 0.000497130958742236, 'samples': 1755840, 'steps': 9144, 'loss/train': 1.5800894498825073} +11/06/2021 22:31:17 - INFO - __main__ - Step 9146: {'lr': 0.0004971301570233392, 'samples': 1756032, 'steps': 9145, 'loss/train': 2.155123472213745} +11/06/2021 22:31:18 - INFO - __main__ - Step 9147: {'lr': 0.0004971293551930894, 'samples': 1756224, 'steps': 9146, 'loss/train': 1.0763784646987915} +11/06/2021 22:31:18 - INFO - __main__ - Step 9148: {'lr': 0.0004971285532514868, 'samples': 1756416, 'steps': 9147, 'loss/train': 1.7974958419799805} +11/06/2021 22:31:18 - INFO - __main__ - Step 9149: {'lr': 0.000497127751198532, 'samples': 1756608, 'steps': 9148, 'loss/train': 1.7774125337600708} +11/06/2021 22:31:19 - INFO - __main__ - Step 9150: {'lr': 0.0004971269490342252, 'samples': 1756800, 'steps': 9149, 'loss/train': 1.6433255672454834} +11/06/2021 22:31:19 - INFO - __main__ - Step 9151: {'lr': 0.0004971261467585669, 'samples': 1756992, 'steps': 9150, 'loss/train': 2.028750419616699} +11/06/2021 22:31:20 - INFO - __main__ - Step 9152: {'lr': 0.0004971253443715572, 'samples': 1757184, 'steps': 9151, 'loss/train': 1.2226204872131348} +11/06/2021 22:31:20 - INFO - __main__ - Step 9153: {'lr': 0.0004971245418731966, 'samples': 1757376, 'steps': 9152, 'loss/train': 2.202749490737915} +11/06/2021 22:31:21 - INFO - __main__ - Step 9154: {'lr': 0.0004971237392634857, 'samples': 1757568, 'steps': 9153, 'loss/train': 1.7844159603118896} +11/06/2021 22:31:21 - INFO - __main__ - Step 9155: {'lr': 0.0004971229365424246, 'samples': 1757760, 'steps': 9154, 'loss/train': 1.973191738128662} +11/06/2021 22:31:21 - INFO - __main__ - Step 9156: {'lr': 0.0004971221337100137, 'samples': 1757952, 'steps': 9155, 'loss/train': 1.785252332687378} +11/06/2021 22:31:23 - INFO - __main__ - Step 9157: {'lr': 0.0004971213307662534, 'samples': 1758144, 'steps': 9156, 'loss/train': 2.1560020446777344} +11/06/2021 22:31:23 - INFO - __main__ - Step 9158: {'lr': 0.000497120527711144, 'samples': 1758336, 'steps': 9157, 'loss/train': 1.1199406385421753} +11/06/2021 22:31:23 - INFO - __main__ - Step 9159: {'lr': 0.0004971197245446859, 'samples': 1758528, 'steps': 9158, 'loss/train': 2.273866891860962} +11/06/2021 22:31:24 - INFO - __main__ - Step 9160: {'lr': 0.0004971189212668794, 'samples': 1758720, 'steps': 9159, 'loss/train': 2.1585633754730225} +11/06/2021 22:31:24 - INFO - __main__ - Step 9161: {'lr': 0.0004971181178777251, 'samples': 1758912, 'steps': 9160, 'loss/train': 2.7556064128875732} +11/06/2021 22:31:24 - INFO - __main__ - Step 9162: {'lr': 0.0004971173143772231, 'samples': 1759104, 'steps': 9161, 'loss/train': 1.7603553533554077} +11/06/2021 22:31:25 - INFO - __main__ - Step 9163: {'lr': 0.0004971165107653738, 'samples': 1759296, 'steps': 9162, 'loss/train': 1.7750883102416992} +11/06/2021 22:31:26 - INFO - __main__ - Step 9164: {'lr': 0.0004971157070421776, 'samples': 1759488, 'steps': 9163, 'loss/train': 2.1838340759277344} +11/06/2021 22:31:26 - INFO - __main__ - Step 9165: {'lr': 0.000497114903207635, 'samples': 1759680, 'steps': 9164, 'loss/train': 2.311770439147949} +11/06/2021 22:31:26 - INFO - __main__ - Step 9166: {'lr': 0.0004971140992617462, 'samples': 1759872, 'steps': 9165, 'loss/train': 1.977513074874878} +11/06/2021 22:31:27 - INFO - __main__ - Step 9167: {'lr': 0.0004971132952045115, 'samples': 1760064, 'steps': 9166, 'loss/train': 1.9859895706176758} +11/06/2021 22:31:28 - INFO - __main__ - Step 9168: {'lr': 0.0004971124910359315, 'samples': 1760256, 'steps': 9167, 'loss/train': 1.7666734457015991} +11/06/2021 22:31:28 - INFO - __main__ - Step 9169: {'lr': 0.0004971116867560064, 'samples': 1760448, 'steps': 9168, 'loss/train': 1.7961926460266113} +11/06/2021 22:31:28 - INFO - __main__ - Step 9170: {'lr': 0.0004971108823647365, 'samples': 1760640, 'steps': 9169, 'loss/train': 1.904386281967163} +11/06/2021 22:31:29 - INFO - __main__ - Step 9171: {'lr': 0.0004971100778621223, 'samples': 1760832, 'steps': 9170, 'loss/train': 1.477123498916626} +11/06/2021 22:31:29 - INFO - __main__ - Step 9172: {'lr': 0.0004971092732481641, 'samples': 1761024, 'steps': 9171, 'loss/train': 1.5037059783935547} +11/06/2021 22:31:30 - INFO - __main__ - Step 9173: {'lr': 0.0004971084685228623, 'samples': 1761216, 'steps': 9172, 'loss/train': 1.8202991485595703} +11/06/2021 22:31:30 - INFO - __main__ - Step 9174: {'lr': 0.0004971076636862172, 'samples': 1761408, 'steps': 9173, 'loss/train': 1.7181813716888428} +11/06/2021 22:31:31 - INFO - __main__ - Step 9175: {'lr': 0.0004971068587382293, 'samples': 1761600, 'steps': 9174, 'loss/train': 1.4500627517700195} +11/06/2021 22:31:31 - INFO - __main__ - Step 9176: {'lr': 0.0004971060536788988, 'samples': 1761792, 'steps': 9175, 'loss/train': 1.9381426572799683} +11/06/2021 22:31:31 - INFO - __main__ - Step 9177: {'lr': 0.000497105248508226, 'samples': 1761984, 'steps': 9176, 'loss/train': 1.841038465499878} +11/06/2021 22:31:33 - INFO - __main__ - Step 9178: {'lr': 0.0004971044432262115, 'samples': 1762176, 'steps': 9177, 'loss/train': 1.351794958114624} +11/06/2021 22:31:33 - INFO - __main__ - Step 9179: {'lr': 0.0004971036378328556, 'samples': 1762368, 'steps': 9178, 'loss/train': 1.7219154834747314} +11/06/2021 22:31:33 - INFO - __main__ - Step 9180: {'lr': 0.0004971028323281586, 'samples': 1762560, 'steps': 9179, 'loss/train': 2.6767475605010986} +11/06/2021 22:31:34 - INFO - __main__ - Step 9181: {'lr': 0.0004971020267121208, 'samples': 1762752, 'steps': 9180, 'loss/train': 2.2747514247894287} +11/06/2021 22:31:34 - INFO - __main__ - Step 9182: {'lr': 0.0004971012209847427, 'samples': 1762944, 'steps': 9181, 'loss/train': 1.0986586809158325} +11/06/2021 22:31:35 - INFO - __main__ - Step 9183: {'lr': 0.0004971004151460245, 'samples': 1763136, 'steps': 9182, 'loss/train': 1.2503761053085327} +11/06/2021 22:31:35 - INFO - __main__ - Step 9184: {'lr': 0.0004970996091959668, 'samples': 1763328, 'steps': 9183, 'loss/train': 1.487623691558838} +11/06/2021 22:31:36 - INFO - __main__ - Step 9185: {'lr': 0.0004970988031345698, 'samples': 1763520, 'steps': 9184, 'loss/train': 1.718331217765808} +11/06/2021 22:31:36 - INFO - __main__ - Step 9186: {'lr': 0.0004970979969618338, 'samples': 1763712, 'steps': 9185, 'loss/train': 1.1969623565673828} +11/06/2021 22:31:36 - INFO - __main__ - Step 9187: {'lr': 0.0004970971906777593, 'samples': 1763904, 'steps': 9186, 'loss/train': 1.9592634439468384} +11/06/2021 22:31:37 - INFO - __main__ - Step 9188: {'lr': 0.0004970963842823468, 'samples': 1764096, 'steps': 9187, 'loss/train': 1.1920486688613892} +11/06/2021 22:31:38 - INFO - __main__ - Step 9189: {'lr': 0.0004970955777755963, 'samples': 1764288, 'steps': 9188, 'loss/train': 1.6599271297454834} +11/06/2021 22:31:39 - INFO - __main__ - Step 9190: {'lr': 0.0004970947711575083, 'samples': 1764480, 'steps': 9189, 'loss/train': 1.8432694673538208} +11/06/2021 22:31:39 - INFO - __main__ - Step 9191: {'lr': 0.0004970939644280833, 'samples': 1764672, 'steps': 9190, 'loss/train': 1.6999132633209229} +11/06/2021 22:31:39 - INFO - __main__ - Step 9192: {'lr': 0.0004970931575873215, 'samples': 1764864, 'steps': 9191, 'loss/train': 1.533847451210022} +11/06/2021 22:31:40 - INFO - __main__ - Step 9193: {'lr': 0.0004970923506352234, 'samples': 1765056, 'steps': 9192, 'loss/train': 1.8772602081298828} +11/06/2021 22:31:40 - INFO - __main__ - Step 9194: {'lr': 0.0004970915435717893, 'samples': 1765248, 'steps': 9193, 'loss/train': 1.8430668115615845} +11/06/2021 22:31:41 - INFO - __main__ - Step 9195: {'lr': 0.0004970907363970196, 'samples': 1765440, 'steps': 9194, 'loss/train': 1.7536627054214478} +11/06/2021 22:31:41 - INFO - __main__ - Step 9196: {'lr': 0.0004970899291109145, 'samples': 1765632, 'steps': 9195, 'loss/train': 1.858238697052002} +11/06/2021 22:31:42 - INFO - __main__ - Step 9197: {'lr': 0.0004970891217134746, 'samples': 1765824, 'steps': 9196, 'loss/train': 2.1001169681549072} +11/06/2021 22:31:42 - INFO - __main__ - Step 9198: {'lr': 0.0004970883142047001, 'samples': 1766016, 'steps': 9197, 'loss/train': 2.0097129344940186} +11/06/2021 22:31:43 - INFO - __main__ - Step 9199: {'lr': 0.0004970875065845914, 'samples': 1766208, 'steps': 9198, 'loss/train': 2.0182600021362305} +11/06/2021 22:31:44 - INFO - __main__ - Step 9200: {'lr': 0.000497086698853149, 'samples': 1766400, 'steps': 9199, 'loss/train': 1.785837173461914} +11/06/2021 22:31:44 - INFO - __main__ - Step 9201: {'lr': 0.0004970858910103731, 'samples': 1766592, 'steps': 9200, 'loss/train': 1.773368000984192} +11/06/2021 22:31:44 - INFO - __main__ - Step 9202: {'lr': 0.0004970850830562641, 'samples': 1766784, 'steps': 9201, 'loss/train': 2.1283977031707764} +11/06/2021 22:31:45 - INFO - __main__ - Step 9203: {'lr': 0.0004970842749908223, 'samples': 1766976, 'steps': 9202, 'loss/train': 1.710228443145752} +11/06/2021 22:31:45 - INFO - __main__ - Step 9204: {'lr': 0.0004970834668140482, 'samples': 1767168, 'steps': 9203, 'loss/train': 1.6465903520584106} +11/06/2021 22:31:46 - INFO - __main__ - Step 9205: {'lr': 0.0004970826585259421, 'samples': 1767360, 'steps': 9204, 'loss/train': 1.8432360887527466} +11/06/2021 22:31:46 - INFO - __main__ - Step 9206: {'lr': 0.0004970818501265044, 'samples': 1767552, 'steps': 9205, 'loss/train': 1.9140604734420776} +11/06/2021 22:31:47 - INFO - __main__ - Step 9207: {'lr': 0.0004970810416157354, 'samples': 1767744, 'steps': 9206, 'loss/train': 1.4957774877548218} +11/06/2021 22:31:47 - INFO - __main__ - Step 9208: {'lr': 0.0004970802329936355, 'samples': 1767936, 'steps': 9207, 'loss/train': 1.110896110534668} +11/06/2021 22:31:47 - INFO - __main__ - Step 9209: {'lr': 0.000497079424260205, 'samples': 1768128, 'steps': 9208, 'loss/train': 2.041264057159424} +11/06/2021 22:31:48 - INFO - __main__ - Step 9210: {'lr': 0.0004970786154154444, 'samples': 1768320, 'steps': 9209, 'loss/train': 1.8915854692459106} +11/06/2021 22:31:49 - INFO - __main__ - Step 9211: {'lr': 0.000497077806459354, 'samples': 1768512, 'steps': 9210, 'loss/train': 1.495437502861023} +11/06/2021 22:31:49 - INFO - __main__ - Step 9212: {'lr': 0.0004970769973919341, 'samples': 1768704, 'steps': 9211, 'loss/train': 1.2148029804229736} +11/06/2021 22:31:50 - INFO - __main__ - Step 9213: {'lr': 0.0004970761882131851, 'samples': 1768896, 'steps': 9212, 'loss/train': 3.2807438373565674} +11/06/2021 22:31:50 - INFO - __main__ - Step 9214: {'lr': 0.0004970753789231074, 'samples': 1769088, 'steps': 9213, 'loss/train': 1.3468689918518066} +11/06/2021 22:31:50 - INFO - __main__ - Step 9215: {'lr': 0.0004970745695217014, 'samples': 1769280, 'steps': 9214, 'loss/train': 2.1012730598449707} +11/06/2021 22:31:51 - INFO - __main__ - Step 9216: {'lr': 0.0004970737600089673, 'samples': 1769472, 'steps': 9215, 'loss/train': 2.018321990966797} +11/06/2021 22:31:52 - INFO - __main__ - Step 9217: {'lr': 0.0004970729503849057, 'samples': 1769664, 'steps': 9216, 'loss/train': 0.4318278431892395} +11/06/2021 22:31:52 - INFO - __main__ - Step 9218: {'lr': 0.0004970721406495168, 'samples': 1769856, 'steps': 9217, 'loss/train': 1.8669426441192627} +11/06/2021 22:31:53 - INFO - __main__ - Step 9219: {'lr': 0.000497071330802801, 'samples': 1770048, 'steps': 9218, 'loss/train': 1.9158834218978882} +11/06/2021 22:31:53 - INFO - __main__ - Step 9220: {'lr': 0.0004970705208447587, 'samples': 1770240, 'steps': 9219, 'loss/train': 1.9058424234390259} +11/06/2021 22:31:53 - INFO - __main__ - Step 9221: {'lr': 0.0004970697107753902, 'samples': 1770432, 'steps': 9220, 'loss/train': 2.554187059402466} +11/06/2021 22:31:54 - INFO - __main__ - Step 9222: {'lr': 0.0004970689005946959, 'samples': 1770624, 'steps': 9221, 'loss/train': 1.937746286392212} +11/06/2021 22:31:55 - INFO - __main__ - Step 9223: {'lr': 0.0004970680903026762, 'samples': 1770816, 'steps': 9222, 'loss/train': 1.8598175048828125} +11/06/2021 22:31:55 - INFO - __main__ - Step 9224: {'lr': 0.0004970672798993313, 'samples': 1771008, 'steps': 9223, 'loss/train': 1.6042256355285645} +11/06/2021 22:31:55 - INFO - __main__ - Step 9225: {'lr': 0.0004970664693846618, 'samples': 1771200, 'steps': 9224, 'loss/train': 1.7904118299484253} +11/06/2021 22:31:56 - INFO - __main__ - Step 9226: {'lr': 0.000497065658758668, 'samples': 1771392, 'steps': 9225, 'loss/train': 1.8984659910202026} +11/06/2021 22:31:57 - INFO - __main__ - Step 9227: {'lr': 0.0004970648480213502, 'samples': 1771584, 'steps': 9226, 'loss/train': 2.082733631134033} +11/06/2021 22:31:57 - INFO - __main__ - Step 9228: {'lr': 0.0004970640371727088, 'samples': 1771776, 'steps': 9227, 'loss/train': 1.6446478366851807} +11/06/2021 22:31:57 - INFO - __main__ - Step 9229: {'lr': 0.0004970632262127441, 'samples': 1771968, 'steps': 9228, 'loss/train': 1.608752965927124} +11/06/2021 22:31:58 - INFO - __main__ - Step 9230: {'lr': 0.0004970624151414565, 'samples': 1772160, 'steps': 9229, 'loss/train': 1.8369768857955933} +11/06/2021 22:31:58 - INFO - __main__ - Step 9231: {'lr': 0.0004970616039588465, 'samples': 1772352, 'steps': 9230, 'loss/train': 1.8356631994247437} +11/06/2021 22:31:59 - INFO - __main__ - Step 9232: {'lr': 0.0004970607926649143, 'samples': 1772544, 'steps': 9231, 'loss/train': 1.8199883699417114} +11/06/2021 22:31:59 - INFO - __main__ - Step 9233: {'lr': 0.0004970599812596603, 'samples': 1772736, 'steps': 9232, 'loss/train': 1.2998876571655273} +11/06/2021 22:32:00 - INFO - __main__ - Step 9234: {'lr': 0.0004970591697430849, 'samples': 1772928, 'steps': 9233, 'loss/train': 1.8944025039672852} +11/06/2021 22:32:00 - INFO - __main__ - Step 9235: {'lr': 0.0004970583581151885, 'samples': 1773120, 'steps': 9234, 'loss/train': 1.8377676010131836} +11/06/2021 22:32:00 - INFO - __main__ - Step 9236: {'lr': 0.0004970575463759713, 'samples': 1773312, 'steps': 9235, 'loss/train': 1.6329200267791748} +11/06/2021 22:32:02 - INFO - __main__ - Step 9237: {'lr': 0.0004970567345254339, 'samples': 1773504, 'steps': 9236, 'loss/train': 1.544152021408081} +11/06/2021 22:32:02 - INFO - __main__ - Step 9238: {'lr': 0.0004970559225635765, 'samples': 1773696, 'steps': 9237, 'loss/train': 1.5652451515197754} +11/06/2021 22:32:02 - INFO - __main__ - Step 9239: {'lr': 0.0004970551104903995, 'samples': 1773888, 'steps': 9238, 'loss/train': 2.267305374145508} +11/06/2021 22:32:03 - INFO - __main__ - Step 9240: {'lr': 0.0004970542983059033, 'samples': 1774080, 'steps': 9239, 'loss/train': 1.8805835247039795} +11/06/2021 22:32:03 - INFO - __main__ - Step 9241: {'lr': 0.0004970534860100883, 'samples': 1774272, 'steps': 9240, 'loss/train': 1.7890807390213013} +11/06/2021 22:32:04 - INFO - __main__ - Step 9242: {'lr': 0.0004970526736029547, 'samples': 1774464, 'steps': 9241, 'loss/train': 1.4509460926055908} +11/06/2021 22:32:04 - INFO - __main__ - Step 9243: {'lr': 0.000497051861084503, 'samples': 1774656, 'steps': 9242, 'loss/train': 1.3258929252624512} +11/06/2021 22:32:05 - INFO - __main__ - Step 9244: {'lr': 0.0004970510484547336, 'samples': 1774848, 'steps': 9243, 'loss/train': 1.9906156063079834} +11/06/2021 22:32:05 - INFO - __main__ - Step 9245: {'lr': 0.0004970502357136468, 'samples': 1775040, 'steps': 9244, 'loss/train': 1.9643011093139648} +11/06/2021 22:32:05 - INFO - __main__ - Step 9246: {'lr': 0.0004970494228612429, 'samples': 1775232, 'steps': 9245, 'loss/train': 1.9511194229125977} +11/06/2021 22:32:06 - INFO - __main__ - Step 9247: {'lr': 0.0004970486098975224, 'samples': 1775424, 'steps': 9246, 'loss/train': 1.7946999073028564} +11/06/2021 22:32:07 - INFO - __main__ - Step 9248: {'lr': 0.0004970477968224856, 'samples': 1775616, 'steps': 9247, 'loss/train': 1.9336384534835815} +11/06/2021 22:32:07 - INFO - __main__ - Step 9249: {'lr': 0.000497046983636133, 'samples': 1775808, 'steps': 9248, 'loss/train': 1.3553489446640015} +11/06/2021 22:32:07 - INFO - __main__ - Step 9250: {'lr': 0.0004970461703384647, 'samples': 1776000, 'steps': 9249, 'loss/train': 1.9446792602539062} +11/06/2021 22:32:08 - INFO - __main__ - Step 9251: {'lr': 0.0004970453569294812, 'samples': 1776192, 'steps': 9250, 'loss/train': 1.8456064462661743} +11/06/2021 22:32:08 - INFO - __main__ - Step 9252: {'lr': 0.000497044543409183, 'samples': 1776384, 'steps': 9251, 'loss/train': 1.9062843322753906} +11/06/2021 22:32:09 - INFO - __main__ - Step 9253: {'lr': 0.0004970437297775702, 'samples': 1776576, 'steps': 9252, 'loss/train': 1.9113454818725586} +11/06/2021 22:32:10 - INFO - __main__ - Step 9254: {'lr': 0.0004970429160346433, 'samples': 1776768, 'steps': 9253, 'loss/train': 1.5249048471450806} +11/06/2021 22:32:10 - INFO - __main__ - Step 9255: {'lr': 0.0004970421021804027, 'samples': 1776960, 'steps': 9254, 'loss/train': 2.172207832336426} +11/06/2021 22:32:10 - INFO - __main__ - Step 9256: {'lr': 0.0004970412882148488, 'samples': 1777152, 'steps': 9255, 'loss/train': 1.1907613277435303} +11/06/2021 22:32:11 - INFO - __main__ - Step 9257: {'lr': 0.0004970404741379818, 'samples': 1777344, 'steps': 9256, 'loss/train': 1.6788753271102905} +11/06/2021 22:32:12 - INFO - __main__ - Step 9258: {'lr': 0.0004970396599498023, 'samples': 1777536, 'steps': 9257, 'loss/train': 1.072892189025879} +11/06/2021 22:32:12 - INFO - __main__ - Step 9259: {'lr': 0.0004970388456503105, 'samples': 1777728, 'steps': 9258, 'loss/train': 1.4916554689407349} +11/06/2021 22:32:13 - INFO - __main__ - Step 9260: {'lr': 0.0004970380312395069, 'samples': 1777920, 'steps': 9259, 'loss/train': 1.7013155221939087} +11/06/2021 22:32:13 - INFO - __main__ - Step 9261: {'lr': 0.0004970372167173915, 'samples': 1778112, 'steps': 9260, 'loss/train': 2.010669708251953} +11/06/2021 22:32:13 - INFO - __main__ - Step 9262: {'lr': 0.0004970364020839652, 'samples': 1778304, 'steps': 9261, 'loss/train': 1.8238394260406494} +11/06/2021 22:32:14 - INFO - __main__ - Step 9263: {'lr': 0.0004970355873392281, 'samples': 1778496, 'steps': 9262, 'loss/train': 1.3550951480865479} +11/06/2021 22:32:15 - INFO - __main__ - Step 9264: {'lr': 0.0004970347724831804, 'samples': 1778688, 'steps': 9263, 'loss/train': 1.880463719367981} +11/06/2021 22:32:15 - INFO - __main__ - Step 9265: {'lr': 0.0004970339575158228, 'samples': 1778880, 'steps': 9264, 'loss/train': 1.692347764968872} +11/06/2021 22:32:15 - INFO - __main__ - Step 9266: {'lr': 0.0004970331424371555, 'samples': 1779072, 'steps': 9265, 'loss/train': 1.760794997215271} +11/06/2021 22:32:16 - INFO - __main__ - Step 9267: {'lr': 0.0004970323272471788, 'samples': 1779264, 'steps': 9266, 'loss/train': 1.9668833017349243} +11/06/2021 22:32:16 - INFO - __main__ - Step 9268: {'lr': 0.0004970315119458931, 'samples': 1779456, 'steps': 9267, 'loss/train': 1.905427098274231} +11/06/2021 22:32:17 - INFO - __main__ - Step 9269: {'lr': 0.000497030696533299, 'samples': 1779648, 'steps': 9268, 'loss/train': 1.6687836647033691} +11/06/2021 22:32:17 - INFO - __main__ - Step 9270: {'lr': 0.0004970298810093965, 'samples': 1779840, 'steps': 9269, 'loss/train': 1.7328218221664429} +11/06/2021 22:32:18 - INFO - __main__ - Step 9271: {'lr': 0.0004970290653741863, 'samples': 1780032, 'steps': 9270, 'loss/train': 1.6917048692703247} +11/06/2021 22:32:18 - INFO - __main__ - Step 9272: {'lr': 0.0004970282496276684, 'samples': 1780224, 'steps': 9271, 'loss/train': 1.8625608682632446} +11/06/2021 22:32:19 - INFO - __main__ - Step 9273: {'lr': 0.0004970274337698436, 'samples': 1780416, 'steps': 9272, 'loss/train': 1.789774775505066} +11/06/2021 22:32:19 - INFO - __main__ - Step 9274: {'lr': 0.000497026617800712, 'samples': 1780608, 'steps': 9273, 'loss/train': 1.5155421495437622} +11/06/2021 22:32:20 - INFO - __main__ - Step 9275: {'lr': 0.000497025801720274, 'samples': 1780800, 'steps': 9274, 'loss/train': 1.8197972774505615} +11/06/2021 22:32:20 - INFO - __main__ - Step 9276: {'lr': 0.00049702498552853, 'samples': 1780992, 'steps': 9275, 'loss/train': 2.1639773845672607} +11/06/2021 22:32:21 - INFO - __main__ - Step 9277: {'lr': 0.0004970241692254803, 'samples': 1781184, 'steps': 9276, 'loss/train': 1.6572617292404175} +11/06/2021 22:32:21 - INFO - __main__ - Step 9278: {'lr': 0.0004970233528111253, 'samples': 1781376, 'steps': 9277, 'loss/train': 1.9275052547454834} +11/06/2021 22:32:22 - INFO - __main__ - Step 9279: {'lr': 0.0004970225362854654, 'samples': 1781568, 'steps': 9278, 'loss/train': 1.4207885265350342} +11/06/2021 22:32:22 - INFO - __main__ - Step 9280: {'lr': 0.0004970217196485011, 'samples': 1781760, 'steps': 9279, 'loss/train': 1.7480263710021973} +11/06/2021 22:32:23 - INFO - __main__ - Step 9281: {'lr': 0.0004970209029002325, 'samples': 1781952, 'steps': 9280, 'loss/train': 2.001077890396118} +11/06/2021 22:32:23 - INFO - __main__ - Step 9282: {'lr': 0.0004970200860406601, 'samples': 1782144, 'steps': 9281, 'loss/train': 1.4385563135147095} +11/06/2021 22:32:23 - INFO - __main__ - Step 9283: {'lr': 0.0004970192690697843, 'samples': 1782336, 'steps': 9282, 'loss/train': 1.1170109510421753} +11/06/2021 22:32:24 - INFO - __main__ - Step 9284: {'lr': 0.0004970184519876053, 'samples': 1782528, 'steps': 9283, 'loss/train': 1.6639217138290405} +11/06/2021 22:32:25 - INFO - __main__ - Step 9285: {'lr': 0.0004970176347941237, 'samples': 1782720, 'steps': 9284, 'loss/train': 1.5901360511779785} +11/06/2021 22:32:25 - INFO - __main__ - Step 9286: {'lr': 0.0004970168174893398, 'samples': 1782912, 'steps': 9285, 'loss/train': 2.016771078109741} +11/06/2021 22:32:25 - INFO - __main__ - Step 9287: {'lr': 0.0004970160000732539, 'samples': 1783104, 'steps': 9286, 'loss/train': 1.7004362344741821} +11/06/2021 22:32:26 - INFO - __main__ - Step 9288: {'lr': 0.0004970151825458664, 'samples': 1783296, 'steps': 9287, 'loss/train': 2.1699607372283936} +11/06/2021 22:32:27 - INFO - __main__ - Step 9289: {'lr': 0.0004970143649071777, 'samples': 1783488, 'steps': 9288, 'loss/train': 1.9318630695343018} +11/06/2021 22:32:27 - INFO - __main__ - Step 9290: {'lr': 0.0004970135471571881, 'samples': 1783680, 'steps': 9289, 'loss/train': 1.4492002725601196} +11/06/2021 22:32:28 - INFO - __main__ - Step 9291: {'lr': 0.000497012729295898, 'samples': 1783872, 'steps': 9290, 'loss/train': 1.6423429250717163} +11/06/2021 22:32:28 - INFO - __main__ - Step 9292: {'lr': 0.0004970119113233078, 'samples': 1784064, 'steps': 9291, 'loss/train': 1.7522389888763428} +11/06/2021 22:32:28 - INFO - __main__ - Step 9293: {'lr': 0.0004970110932394178, 'samples': 1784256, 'steps': 9292, 'loss/train': 1.4317411184310913} +11/06/2021 22:32:29 - INFO - __main__ - Step 9294: {'lr': 0.0004970102750442285, 'samples': 1784448, 'steps': 9293, 'loss/train': 2.1833393573760986} +11/06/2021 22:32:30 - INFO - __main__ - Step 9295: {'lr': 0.0004970094567377402, 'samples': 1784640, 'steps': 9294, 'loss/train': 0.5875868797302246} +11/06/2021 22:32:30 - INFO - __main__ - Step 9296: {'lr': 0.0004970086383199532, 'samples': 1784832, 'steps': 9295, 'loss/train': 2.128361701965332} +11/06/2021 22:32:30 - INFO - __main__ - Step 9297: {'lr': 0.0004970078197908678, 'samples': 1785024, 'steps': 9296, 'loss/train': 1.418079137802124} +11/06/2021 22:32:31 - INFO - __main__ - Step 9298: {'lr': 0.0004970070011504846, 'samples': 1785216, 'steps': 9297, 'loss/train': 1.8061836957931519} +11/06/2021 22:32:31 - INFO - __main__ - Step 9299: {'lr': 0.0004970061823988038, 'samples': 1785408, 'steps': 9298, 'loss/train': 1.9081430435180664} +11/06/2021 22:32:32 - INFO - __main__ - Step 9300: {'lr': 0.0004970053635358259, 'samples': 1785600, 'steps': 9299, 'loss/train': 1.5807913541793823} +11/06/2021 22:32:33 - INFO - __main__ - Step 9301: {'lr': 0.0004970045445615512, 'samples': 1785792, 'steps': 9300, 'loss/train': 1.5762659311294556} +11/06/2021 22:32:33 - INFO - __main__ - Step 9302: {'lr': 0.00049700372547598, 'samples': 1785984, 'steps': 9301, 'loss/train': 1.5313711166381836} +11/06/2021 22:32:33 - INFO - __main__ - Step 9303: {'lr': 0.0004970029062791128, 'samples': 1786176, 'steps': 9302, 'loss/train': 1.933624505996704} +11/06/2021 22:32:34 - INFO - __main__ - Step 9304: {'lr': 0.0004970020869709498, 'samples': 1786368, 'steps': 9303, 'loss/train': 1.6305302381515503} +11/06/2021 22:32:35 - INFO - __main__ - Step 9305: {'lr': 0.0004970012675514915, 'samples': 1786560, 'steps': 9304, 'loss/train': 1.5275381803512573} +11/06/2021 22:32:35 - INFO - __main__ - Step 9306: {'lr': 0.0004970004480207384, 'samples': 1786752, 'steps': 9305, 'loss/train': 1.6243155002593994} +11/06/2021 22:32:35 - INFO - __main__ - Step 9307: {'lr': 0.0004969996283786905, 'samples': 1786944, 'steps': 9306, 'loss/train': 1.8101203441619873} +11/06/2021 22:32:36 - INFO - __main__ - Step 9308: {'lr': 0.0004969988086253486, 'samples': 1787136, 'steps': 9307, 'loss/train': 1.9703173637390137} +11/06/2021 22:32:36 - INFO - __main__ - Step 9309: {'lr': 0.0004969979887607125, 'samples': 1787328, 'steps': 9308, 'loss/train': 1.6925435066223145} +11/06/2021 22:32:37 - INFO - __main__ - Step 9310: {'lr': 0.0004969971687847832, 'samples': 1787520, 'steps': 9309, 'loss/train': 2.585664749145508} +11/06/2021 22:32:37 - INFO - __main__ - Step 9311: {'lr': 0.0004969963486975607, 'samples': 1787712, 'steps': 9310, 'loss/train': 1.2041494846343994} +11/06/2021 22:32:38 - INFO - __main__ - Step 9312: {'lr': 0.0004969955284990455, 'samples': 1787904, 'steps': 9311, 'loss/train': 1.6597546339035034} +11/06/2021 22:32:38 - INFO - __main__ - Step 9313: {'lr': 0.0004969947081892379, 'samples': 1788096, 'steps': 9312, 'loss/train': 1.6976758241653442} +11/06/2021 22:32:38 - INFO - __main__ - Step 9314: {'lr': 0.0004969938877681383, 'samples': 1788288, 'steps': 9313, 'loss/train': 1.9452763795852661} +11/06/2021 22:32:39 - INFO - __main__ - Step 9315: {'lr': 0.0004969930672357471, 'samples': 1788480, 'steps': 9314, 'loss/train': 2.183551788330078} +11/06/2021 22:32:40 - INFO - __main__ - Step 9316: {'lr': 0.0004969922465920645, 'samples': 1788672, 'steps': 9315, 'loss/train': 2.362039089202881} +11/06/2021 22:32:40 - INFO - __main__ - Step 9317: {'lr': 0.0004969914258370912, 'samples': 1788864, 'steps': 9316, 'loss/train': 2.2192182540893555} +11/06/2021 22:32:41 - INFO - __main__ - Step 9318: {'lr': 0.0004969906049708272, 'samples': 1789056, 'steps': 9317, 'loss/train': 1.708990454673767} +11/06/2021 22:32:41 - INFO - __main__ - Step 9319: {'lr': 0.0004969897839932732, 'samples': 1789248, 'steps': 9318, 'loss/train': 1.988546371459961} +11/06/2021 22:32:41 - INFO - __main__ - Step 9320: {'lr': 0.0004969889629044293, 'samples': 1789440, 'steps': 9319, 'loss/train': 1.3980268239974976} +11/06/2021 22:32:42 - INFO - __main__ - Step 9321: {'lr': 0.000496988141704296, 'samples': 1789632, 'steps': 9320, 'loss/train': 6.165026664733887} +11/06/2021 22:32:43 - INFO - __main__ - Step 9322: {'lr': 0.0004969873203928737, 'samples': 1789824, 'steps': 9321, 'loss/train': 1.2539154291152954} +11/06/2021 22:32:43 - INFO - __main__ - Step 9323: {'lr': 0.0004969864989701626, 'samples': 1790016, 'steps': 9322, 'loss/train': 1.7540534734725952} +11/06/2021 22:32:43 - INFO - __main__ - Step 9324: {'lr': 0.0004969856774361634, 'samples': 1790208, 'steps': 9323, 'loss/train': 1.9644792079925537} +11/06/2021 22:32:44 - INFO - __main__ - Step 9325: {'lr': 0.0004969848557908761, 'samples': 1790400, 'steps': 9324, 'loss/train': 1.722193717956543} +11/06/2021 22:32:44 - INFO - __main__ - Step 9326: {'lr': 0.0004969840340343013, 'samples': 1790592, 'steps': 9325, 'loss/train': 2.381248712539673} +11/06/2021 22:32:45 - INFO - __main__ - Step 9327: {'lr': 0.0004969832121664394, 'samples': 1790784, 'steps': 9326, 'loss/train': 1.3223377466201782} +11/06/2021 22:32:46 - INFO - __main__ - Step 9328: {'lr': 0.0004969823901872906, 'samples': 1790976, 'steps': 9327, 'loss/train': 2.1059629917144775} +11/06/2021 22:32:46 - INFO - __main__ - Step 9329: {'lr': 0.0004969815680968552, 'samples': 1791168, 'steps': 9328, 'loss/train': 1.7567250728607178} +11/06/2021 22:32:46 - INFO - __main__ - Step 9330: {'lr': 0.0004969807458951339, 'samples': 1791360, 'steps': 9329, 'loss/train': 1.10848867893219} +11/06/2021 22:32:47 - INFO - __main__ - Step 9331: {'lr': 0.0004969799235821268, 'samples': 1791552, 'steps': 9330, 'loss/train': 1.527244210243225} +11/06/2021 22:32:48 - INFO - __main__ - Step 9332: {'lr': 0.0004969791011578344, 'samples': 1791744, 'steps': 9331, 'loss/train': 1.9717392921447754} +11/06/2021 22:32:48 - INFO - __main__ - Step 9333: {'lr': 0.000496978278622257, 'samples': 1791936, 'steps': 9332, 'loss/train': 1.1061983108520508} +11/06/2021 22:32:48 - INFO - __main__ - Step 9334: {'lr': 0.000496977455975395, 'samples': 1792128, 'steps': 9333, 'loss/train': 1.6116451025009155} +11/06/2021 22:32:49 - INFO - __main__ - Step 9335: {'lr': 0.0004969766332172488, 'samples': 1792320, 'steps': 9334, 'loss/train': 2.009783983230591} +11/06/2021 22:32:49 - INFO - __main__ - Step 9336: {'lr': 0.0004969758103478187, 'samples': 1792512, 'steps': 9335, 'loss/train': 1.6776036024093628} +11/06/2021 22:32:50 - INFO - __main__ - Step 9337: {'lr': 0.0004969749873671051, 'samples': 1792704, 'steps': 9336, 'loss/train': 1.6824532747268677} +11/06/2021 22:32:50 - INFO - __main__ - Step 9338: {'lr': 0.0004969741642751085, 'samples': 1792896, 'steps': 9337, 'loss/train': 1.9121274948120117} +11/06/2021 22:32:51 - INFO - __main__ - Step 9339: {'lr': 0.000496973341071829, 'samples': 1793088, 'steps': 9338, 'loss/train': 1.8858976364135742} +11/06/2021 22:32:51 - INFO - __main__ - Step 9340: {'lr': 0.0004969725177572672, 'samples': 1793280, 'steps': 9339, 'loss/train': 1.5066814422607422} +11/06/2021 22:32:51 - INFO - __main__ - Step 9341: {'lr': 0.0004969716943314234, 'samples': 1793472, 'steps': 9340, 'loss/train': 1.8776342868804932} +11/06/2021 22:32:52 - INFO - __main__ - Step 9342: {'lr': 0.0004969708707942979, 'samples': 1793664, 'steps': 9341, 'loss/train': 2.180288314819336} +11/06/2021 22:32:53 - INFO - __main__ - Step 9343: {'lr': 0.0004969700471458913, 'samples': 1793856, 'steps': 9342, 'loss/train': 1.4142295122146606} +11/06/2021 22:32:53 - INFO - __main__ - Step 9344: {'lr': 0.0004969692233862036, 'samples': 1794048, 'steps': 9343, 'loss/train': 1.8621501922607422} +11/06/2021 22:32:53 - INFO - __main__ - Step 9345: {'lr': 0.0004969683995152355, 'samples': 1794240, 'steps': 9344, 'loss/train': 3.186241626739502} +11/06/2021 22:32:54 - INFO - __main__ - Step 9346: {'lr': 0.0004969675755329872, 'samples': 1794432, 'steps': 9345, 'loss/train': 1.875054121017456} +11/06/2021 22:32:55 - INFO - __main__ - Step 9347: {'lr': 0.0004969667514394592, 'samples': 1794624, 'steps': 9346, 'loss/train': 2.312483072280884} +11/06/2021 22:32:55 - INFO - __main__ - Step 9348: {'lr': 0.0004969659272346517, 'samples': 1794816, 'steps': 9347, 'loss/train': 1.7761608362197876} +11/06/2021 22:32:56 - INFO - __main__ - Step 9349: {'lr': 0.0004969651029185652, 'samples': 1795008, 'steps': 9348, 'loss/train': 1.646713137626648} +11/06/2021 22:32:56 - INFO - __main__ - Step 9350: {'lr': 0.0004969642784912001, 'samples': 1795200, 'steps': 9349, 'loss/train': 3.636963367462158} +11/06/2021 22:32:57 - INFO - __main__ - Step 9351: {'lr': 0.0004969634539525566, 'samples': 1795392, 'steps': 9350, 'loss/train': 2.115077495574951} +11/06/2021 22:32:57 - INFO - __main__ - Step 9352: {'lr': 0.0004969626293026353, 'samples': 1795584, 'steps': 9351, 'loss/train': 1.7228342294692993} +11/06/2021 22:32:58 - INFO - __main__ - Step 9353: {'lr': 0.0004969618045414363, 'samples': 1795776, 'steps': 9352, 'loss/train': 1.540665626525879} +11/06/2021 22:32:58 - INFO - __main__ - Step 9354: {'lr': 0.0004969609796689602, 'samples': 1795968, 'steps': 9353, 'loss/train': 1.7847797870635986} +11/06/2021 22:32:59 - INFO - __main__ - Step 9355: {'lr': 0.0004969601546852073, 'samples': 1796160, 'steps': 9354, 'loss/train': 1.4905754327774048} +11/06/2021 22:32:59 - INFO - __main__ - Step 9356: {'lr': 0.0004969593295901779, 'samples': 1796352, 'steps': 9355, 'loss/train': 1.998396873474121} +11/06/2021 22:32:59 - INFO - __main__ - Step 9357: {'lr': 0.0004969585043838725, 'samples': 1796544, 'steps': 9356, 'loss/train': 2.060382127761841} +11/06/2021 22:33:00 - INFO - __main__ - Step 9358: {'lr': 0.0004969576790662914, 'samples': 1796736, 'steps': 9357, 'loss/train': 1.823445200920105} +11/06/2021 22:33:01 - INFO - __main__ - Step 9359: {'lr': 0.0004969568536374349, 'samples': 1796928, 'steps': 9358, 'loss/train': 1.6767795085906982} +11/06/2021 22:33:01 - INFO - __main__ - Step 9360: {'lr': 0.0004969560280973036, 'samples': 1797120, 'steps': 9359, 'loss/train': 2.0261526107788086} +11/06/2021 22:33:01 - INFO - __main__ - Step 9361: {'lr': 0.0004969552024458976, 'samples': 1797312, 'steps': 9360, 'loss/train': 1.6986967325210571} +11/06/2021 22:33:02 - INFO - __main__ - Step 9362: {'lr': 0.0004969543766832176, 'samples': 1797504, 'steps': 9361, 'loss/train': 1.3113603591918945} +11/06/2021 22:33:03 - INFO - __main__ - Step 9363: {'lr': 0.0004969535508092635, 'samples': 1797696, 'steps': 9362, 'loss/train': 1.4548332691192627} +11/06/2021 22:33:03 - INFO - __main__ - Step 9364: {'lr': 0.0004969527248240361, 'samples': 1797888, 'steps': 9363, 'loss/train': 2.1433870792388916} +11/06/2021 22:33:03 - INFO - __main__ - Step 9365: {'lr': 0.0004969518987275356, 'samples': 1798080, 'steps': 9364, 'loss/train': 1.7857718467712402} +11/06/2021 22:33:04 - INFO - __main__ - Step 9366: {'lr': 0.0004969510725197624, 'samples': 1798272, 'steps': 9365, 'loss/train': 1.3735690116882324} +11/06/2021 22:33:04 - INFO - __main__ - Step 9367: {'lr': 0.0004969502462007167, 'samples': 1798464, 'steps': 9366, 'loss/train': 2.3249306678771973} +11/06/2021 22:33:05 - INFO - __main__ - Step 9368: {'lr': 0.0004969494197703992, 'samples': 1798656, 'steps': 9367, 'loss/train': 1.9111498594284058} +11/06/2021 22:33:05 - INFO - __main__ - Step 9369: {'lr': 0.00049694859322881, 'samples': 1798848, 'steps': 9368, 'loss/train': 1.7562119960784912} +11/06/2021 22:33:06 - INFO - __main__ - Step 9370: {'lr': 0.0004969477665759496, 'samples': 1799040, 'steps': 9369, 'loss/train': 1.8081409931182861} +11/06/2021 22:33:06 - INFO - __main__ - Step 9371: {'lr': 0.0004969469398118184, 'samples': 1799232, 'steps': 9370, 'loss/train': 1.3036324977874756} +11/06/2021 22:33:07 - INFO - __main__ - Step 9372: {'lr': 0.0004969461129364167, 'samples': 1799424, 'steps': 9371, 'loss/train': 1.8562147617340088} +11/06/2021 22:33:08 - INFO - __main__ - Step 9373: {'lr': 0.0004969452859497449, 'samples': 1799616, 'steps': 9372, 'loss/train': 1.927634596824646} +11/06/2021 22:33:08 - INFO - __main__ - Step 9374: {'lr': 0.0004969444588518034, 'samples': 1799808, 'steps': 9373, 'loss/train': 2.170872449874878} +11/06/2021 22:33:08 - INFO - __main__ - Step 9375: {'lr': 0.0004969436316425924, 'samples': 1800000, 'steps': 9374, 'loss/train': 1.852042317390442} +11/06/2021 22:33:09 - INFO - __main__ - Step 9376: {'lr': 0.0004969428043221125, 'samples': 1800192, 'steps': 9375, 'loss/train': 1.5770512819290161} +11/06/2021 22:33:09 - INFO - __main__ - Step 9377: {'lr': 0.000496941976890364, 'samples': 1800384, 'steps': 9376, 'loss/train': 1.6627328395843506} +11/06/2021 22:33:09 - INFO - __main__ - Step 9378: {'lr': 0.0004969411493473472, 'samples': 1800576, 'steps': 9377, 'loss/train': 1.592746376991272} +11/06/2021 22:33:11 - INFO - __main__ - Step 9379: {'lr': 0.0004969403216930626, 'samples': 1800768, 'steps': 9378, 'loss/train': 1.5629326105117798} +11/06/2021 22:33:11 - INFO - __main__ - Step 9380: {'lr': 0.0004969394939275105, 'samples': 1800960, 'steps': 9379, 'loss/train': 1.9716914892196655} +11/06/2021 22:33:11 - INFO - __main__ - Step 9381: {'lr': 0.0004969386660506912, 'samples': 1801152, 'steps': 9380, 'loss/train': 1.612454891204834} +11/06/2021 22:33:12 - INFO - __main__ - Step 9382: {'lr': 0.0004969378380626051, 'samples': 1801344, 'steps': 9381, 'loss/train': 1.764012336730957} +11/06/2021 22:33:12 - INFO - __main__ - Step 9383: {'lr': 0.0004969370099632528, 'samples': 1801536, 'steps': 9382, 'loss/train': 1.9213483333587646} +11/06/2021 22:33:13 - INFO - __main__ - Step 9384: {'lr': 0.0004969361817526343, 'samples': 1801728, 'steps': 9383, 'loss/train': 1.2012592554092407} +11/06/2021 22:33:14 - INFO - __main__ - Step 9385: {'lr': 0.0004969353534307504, 'samples': 1801920, 'steps': 9384, 'loss/train': 2.151750087738037} +11/06/2021 22:33:14 - INFO - __main__ - Step 9386: {'lr': 0.000496934524997601, 'samples': 1802112, 'steps': 9385, 'loss/train': 0.9660016894340515} +11/06/2021 22:33:14 - INFO - __main__ - Step 9387: {'lr': 0.0004969336964531869, 'samples': 1802304, 'steps': 9386, 'loss/train': 1.7892236709594727} +11/06/2021 22:33:15 - INFO - __main__ - Step 9388: {'lr': 0.0004969328677975083, 'samples': 1802496, 'steps': 9387, 'loss/train': 1.6319315433502197} +11/06/2021 22:33:15 - INFO - __main__ - Step 9389: {'lr': 0.0004969320390305654, 'samples': 1802688, 'steps': 9388, 'loss/train': 2.0772619247436523} +11/06/2021 22:33:16 - INFO - __main__ - Step 9390: {'lr': 0.0004969312101523588, 'samples': 1802880, 'steps': 9389, 'loss/train': 1.8143119812011719} +11/06/2021 22:33:17 - INFO - __main__ - Step 9391: {'lr': 0.0004969303811628888, 'samples': 1803072, 'steps': 9390, 'loss/train': 1.7659382820129395} +11/06/2021 22:33:17 - INFO - __main__ - Step 9392: {'lr': 0.0004969295520621558, 'samples': 1803264, 'steps': 9391, 'loss/train': 2.3056082725524902} +11/06/2021 22:33:17 - INFO - __main__ - Step 9393: {'lr': 0.0004969287228501602, 'samples': 1803456, 'steps': 9392, 'loss/train': 1.8238893747329712} +11/06/2021 22:33:18 - INFO - __main__ - Step 9394: {'lr': 0.0004969278935269022, 'samples': 1803648, 'steps': 9393, 'loss/train': 0.7025987505912781} +11/06/2021 22:33:19 - INFO - __main__ - Step 9395: {'lr': 0.0004969270640923823, 'samples': 1803840, 'steps': 9394, 'loss/train': 1.8956180810928345} +11/06/2021 22:33:19 - INFO - __main__ - Step 9396: {'lr': 0.0004969262345466011, 'samples': 1804032, 'steps': 9395, 'loss/train': 1.8042242527008057} +11/06/2021 22:33:19 - INFO - __main__ - Step 9397: {'lr': 0.0004969254048895585, 'samples': 1804224, 'steps': 9396, 'loss/train': 1.8003126382827759} +11/06/2021 22:33:20 - INFO - __main__ - Step 9398: {'lr': 0.0004969245751212552, 'samples': 1804416, 'steps': 9397, 'loss/train': 1.8957905769348145} +11/06/2021 22:33:20 - INFO - __main__ - Step 9399: {'lr': 0.0004969237452416915, 'samples': 1804608, 'steps': 9398, 'loss/train': 1.0701171159744263} +11/06/2021 22:33:21 - INFO - __main__ - Step 9400: {'lr': 0.0004969229152508678, 'samples': 1804800, 'steps': 9399, 'loss/train': 1.8020981550216675} +11/06/2021 22:33:22 - INFO - __main__ - Step 9401: {'lr': 0.0004969220851487844, 'samples': 1804992, 'steps': 9400, 'loss/train': 0.40175554156303406} +11/06/2021 22:33:22 - INFO - __main__ - Step 9402: {'lr': 0.0004969212549354418, 'samples': 1805184, 'steps': 9401, 'loss/train': 1.8108609914779663} +11/06/2021 22:33:22 - INFO - __main__ - Step 9403: {'lr': 0.0004969204246108402, 'samples': 1805376, 'steps': 9402, 'loss/train': 1.1330207586288452} +11/06/2021 22:33:23 - INFO - __main__ - Step 9404: {'lr': 0.0004969195941749801, 'samples': 1805568, 'steps': 9403, 'loss/train': 1.2011972665786743} +11/06/2021 22:33:23 - INFO - __main__ - Step 9405: {'lr': 0.000496918763627862, 'samples': 1805760, 'steps': 9404, 'loss/train': 1.7720991373062134} +11/06/2021 22:33:24 - INFO - __main__ - Step 9406: {'lr': 0.0004969179329694859, 'samples': 1805952, 'steps': 9405, 'loss/train': 1.7720216512680054} +11/06/2021 22:33:24 - INFO - __main__ - Step 9407: {'lr': 0.0004969171021998525, 'samples': 1806144, 'steps': 9406, 'loss/train': 1.1517207622528076} +11/06/2021 22:33:25 - INFO - __main__ - Step 9408: {'lr': 0.0004969162713189619, 'samples': 1806336, 'steps': 9407, 'loss/train': 1.5206893682479858} +11/06/2021 22:33:25 - INFO - __main__ - Step 9409: {'lr': 0.0004969154403268148, 'samples': 1806528, 'steps': 9408, 'loss/train': 1.8082882165908813} +11/06/2021 22:33:25 - INFO - __main__ - Step 9410: {'lr': 0.0004969146092234114, 'samples': 1806720, 'steps': 9409, 'loss/train': 1.3360158205032349} +11/06/2021 22:33:26 - INFO - __main__ - Step 9411: {'lr': 0.000496913778008752, 'samples': 1806912, 'steps': 9410, 'loss/train': 2.1113593578338623} +11/06/2021 22:33:27 - INFO - __main__ - Step 9412: {'lr': 0.0004969129466828371, 'samples': 1807104, 'steps': 9411, 'loss/train': 2.4222865104675293} +11/06/2021 22:33:27 - INFO - __main__ - Step 9413: {'lr': 0.0004969121152456671, 'samples': 1807296, 'steps': 9412, 'loss/train': 1.631757378578186} +11/06/2021 22:33:27 - INFO - __main__ - Step 9414: {'lr': 0.0004969112836972423, 'samples': 1807488, 'steps': 9413, 'loss/train': 1.678197979927063} +11/06/2021 22:33:28 - INFO - __main__ - Step 9415: {'lr': 0.000496910452037563, 'samples': 1807680, 'steps': 9414, 'loss/train': 2.7772085666656494} +11/06/2021 22:33:29 - INFO - __main__ - Step 9416: {'lr': 0.0004969096202666297, 'samples': 1807872, 'steps': 9415, 'loss/train': 1.9640326499938965} +11/06/2021 22:33:29 - INFO - __main__ - Step 9417: {'lr': 0.0004969087883844428, 'samples': 1808064, 'steps': 9416, 'loss/train': 1.4064429998397827} +11/06/2021 22:33:30 - INFO - __main__ - Step 9418: {'lr': 0.0004969079563910025, 'samples': 1808256, 'steps': 9417, 'loss/train': 1.8658392429351807} +11/06/2021 22:33:30 - INFO - __main__ - Step 9419: {'lr': 0.0004969071242863093, 'samples': 1808448, 'steps': 9418, 'loss/train': 2.186412811279297} +11/06/2021 22:33:30 - INFO - __main__ - Step 9420: {'lr': 0.0004969062920703636, 'samples': 1808640, 'steps': 9419, 'loss/train': 1.6242451667785645} +11/06/2021 22:33:31 - INFO - __main__ - Step 9421: {'lr': 0.0004969054597431658, 'samples': 1808832, 'steps': 9420, 'loss/train': 2.4329140186309814} +11/06/2021 22:33:32 - INFO - __main__ - Step 9422: {'lr': 0.0004969046273047161, 'samples': 1809024, 'steps': 9421, 'loss/train': 1.61650812625885} +11/06/2021 22:33:32 - INFO - __main__ - Step 9423: {'lr': 0.0004969037947550151, 'samples': 1809216, 'steps': 9422, 'loss/train': 1.550029993057251} +11/06/2021 22:33:32 - INFO - __main__ - Step 9424: {'lr': 0.000496902962094063, 'samples': 1809408, 'steps': 9423, 'loss/train': 1.670718789100647} +11/06/2021 22:33:33 - INFO - __main__ - Step 9425: {'lr': 0.0004969021293218602, 'samples': 1809600, 'steps': 9424, 'loss/train': 1.6841366291046143} +11/06/2021 22:33:34 - INFO - __main__ - Step 9426: {'lr': 0.0004969012964384071, 'samples': 1809792, 'steps': 9425, 'loss/train': 2.19000244140625} +11/06/2021 22:33:34 - INFO - __main__ - Step 9427: {'lr': 0.0004969004634437042, 'samples': 1809984, 'steps': 9426, 'loss/train': 1.5909390449523926} +11/06/2021 22:33:34 - INFO - __main__ - Step 9428: {'lr': 0.0004968996303377517, 'samples': 1810176, 'steps': 9427, 'loss/train': 2.3377866744995117} +11/06/2021 22:33:35 - INFO - __main__ - Step 9429: {'lr': 0.00049689879712055, 'samples': 1810368, 'steps': 9428, 'loss/train': 1.959466576576233} +11/06/2021 22:33:35 - INFO - __main__ - Step 9430: {'lr': 0.0004968979637920995, 'samples': 1810560, 'steps': 9429, 'loss/train': 2.1791741847991943} +11/06/2021 22:33:35 - INFO - __main__ - Step 9431: {'lr': 0.0004968971303524007, 'samples': 1810752, 'steps': 9430, 'loss/train': 1.2849524021148682} +11/06/2021 22:33:36 - INFO - __main__ - Step 9432: {'lr': 0.0004968962968014537, 'samples': 1810944, 'steps': 9431, 'loss/train': 1.7930939197540283} +11/06/2021 22:33:37 - INFO - __main__ - Step 9433: {'lr': 0.0004968954631392592, 'samples': 1811136, 'steps': 9432, 'loss/train': 1.8857711553573608} +11/06/2021 22:33:37 - INFO - __main__ - Step 9434: {'lr': 0.0004968946293658173, 'samples': 1811328, 'steps': 9433, 'loss/train': 1.6014503240585327} +11/06/2021 22:33:37 - INFO - __main__ - Step 9435: {'lr': 0.0004968937954811284, 'samples': 1811520, 'steps': 9434, 'loss/train': 1.701316237449646} +11/06/2021 22:33:38 - INFO - __main__ - Step 9436: {'lr': 0.0004968929614851932, 'samples': 1811712, 'steps': 9435, 'loss/train': 1.106537938117981} +11/06/2021 22:33:39 - INFO - __main__ - Step 9437: {'lr': 0.0004968921273780118, 'samples': 1811904, 'steps': 9436, 'loss/train': 1.812904715538025} +11/06/2021 22:33:39 - INFO - __main__ - Step 9438: {'lr': 0.0004968912931595845, 'samples': 1812096, 'steps': 9437, 'loss/train': 1.294390082359314} +11/06/2021 22:33:39 - INFO - __main__ - Step 9439: {'lr': 0.0004968904588299118, 'samples': 1812288, 'steps': 9438, 'loss/train': 1.2054589986801147} +11/06/2021 22:33:40 - INFO - __main__ - Step 9440: {'lr': 0.0004968896243889941, 'samples': 1812480, 'steps': 9439, 'loss/train': 1.6848827600479126} +11/06/2021 22:33:40 - INFO - __main__ - Step 9441: {'lr': 0.0004968887898368318, 'samples': 1812672, 'steps': 9440, 'loss/train': 2.0966432094573975} +11/06/2021 22:33:41 - INFO - __main__ - Step 9442: {'lr': 0.0004968879551734252, 'samples': 1812864, 'steps': 9441, 'loss/train': 1.6406598091125488} +11/06/2021 22:33:42 - INFO - __main__ - Step 9443: {'lr': 0.0004968871203987746, 'samples': 1813056, 'steps': 9442, 'loss/train': 1.871316909790039} +11/06/2021 22:33:42 - INFO - __main__ - Step 9444: {'lr': 0.0004968862855128806, 'samples': 1813248, 'steps': 9443, 'loss/train': 1.394817590713501} +11/06/2021 22:33:42 - INFO - __main__ - Step 9445: {'lr': 0.0004968854505157434, 'samples': 1813440, 'steps': 9444, 'loss/train': 1.726036787033081} +11/06/2021 22:33:43 - INFO - __main__ - Step 9446: {'lr': 0.0004968846154073634, 'samples': 1813632, 'steps': 9445, 'loss/train': 0.7175917625427246} +11/06/2021 22:33:44 - INFO - __main__ - Step 9447: {'lr': 0.0004968837801877411, 'samples': 1813824, 'steps': 9446, 'loss/train': 1.9097816944122314} +11/06/2021 22:33:44 - INFO - __main__ - Step 9448: {'lr': 0.0004968829448568766, 'samples': 1814016, 'steps': 9447, 'loss/train': 1.6947396993637085} +11/06/2021 22:33:44 - INFO - __main__ - Step 9449: {'lr': 0.0004968821094147706, 'samples': 1814208, 'steps': 9448, 'loss/train': 1.652908205986023} +11/06/2021 22:33:45 - INFO - __main__ - Step 9450: {'lr': 0.0004968812738614232, 'samples': 1814400, 'steps': 9449, 'loss/train': 1.8884683847427368} +11/06/2021 22:33:45 - INFO - __main__ - Step 9451: {'lr': 0.000496880438196835, 'samples': 1814592, 'steps': 9450, 'loss/train': 1.878915786743164} +11/06/2021 22:33:46 - INFO - __main__ - Step 9452: {'lr': 0.0004968796024210064, 'samples': 1814784, 'steps': 9451, 'loss/train': 1.934395670890808} +11/06/2021 22:33:46 - INFO - __main__ - Step 9453: {'lr': 0.0004968787665339375, 'samples': 1814976, 'steps': 9452, 'loss/train': 1.7748756408691406} +11/06/2021 22:33:47 - INFO - __main__ - Step 9454: {'lr': 0.0004968779305356289, 'samples': 1815168, 'steps': 9453, 'loss/train': 1.8355199098587036} +11/06/2021 22:33:47 - INFO - __main__ - Step 9455: {'lr': 0.0004968770944260808, 'samples': 1815360, 'steps': 9454, 'loss/train': 1.931564450263977} +11/06/2021 22:33:47 - INFO - __main__ - Step 9456: {'lr': 0.0004968762582052938, 'samples': 1815552, 'steps': 9455, 'loss/train': 1.959632396697998} +11/06/2021 22:33:48 - INFO - __main__ - Step 9457: {'lr': 0.0004968754218732682, 'samples': 1815744, 'steps': 9456, 'loss/train': 1.8338159322738647} +11/06/2021 22:33:49 - INFO - __main__ - Step 9458: {'lr': 0.0004968745854300043, 'samples': 1815936, 'steps': 9457, 'loss/train': 1.7420405149459839} +11/06/2021 22:33:49 - INFO - __main__ - Step 9459: {'lr': 0.0004968737488755025, 'samples': 1816128, 'steps': 9458, 'loss/train': 1.8314000368118286} +11/06/2021 22:33:49 - INFO - __main__ - Step 9460: {'lr': 0.0004968729122097632, 'samples': 1816320, 'steps': 9459, 'loss/train': 1.9877064228057861} +11/06/2021 22:33:50 - INFO - __main__ - Step 9461: {'lr': 0.0004968720754327867, 'samples': 1816512, 'steps': 9460, 'loss/train': 1.5283275842666626} +11/06/2021 22:33:51 - INFO - __main__ - Step 9462: {'lr': 0.0004968712385445737, 'samples': 1816704, 'steps': 9461, 'loss/train': 1.5519593954086304} +11/06/2021 22:33:51 - INFO - __main__ - Step 9463: {'lr': 0.0004968704015451241, 'samples': 1816896, 'steps': 9462, 'loss/train': 2.173038959503174} +11/06/2021 22:33:51 - INFO - __main__ - Step 9464: {'lr': 0.0004968695644344387, 'samples': 1817088, 'steps': 9463, 'loss/train': 2.0512888431549072} +11/06/2021 22:33:52 - INFO - __main__ - Step 9465: {'lr': 0.0004968687272125174, 'samples': 1817280, 'steps': 9464, 'loss/train': 1.5592188835144043} +11/06/2021 22:33:52 - INFO - __main__ - Step 9466: {'lr': 0.0004968678898793611, 'samples': 1817472, 'steps': 9465, 'loss/train': 1.7354072332382202} +11/06/2021 22:33:53 - INFO - __main__ - Step 9467: {'lr': 0.0004968670524349699, 'samples': 1817664, 'steps': 9466, 'loss/train': 1.9592326879501343} +11/06/2021 22:33:54 - INFO - __main__ - Step 9468: {'lr': 0.0004968662148793441, 'samples': 1817856, 'steps': 9467, 'loss/train': 1.6401126384735107} +11/06/2021 22:33:54 - INFO - __main__ - Step 9469: {'lr': 0.0004968653772124843, 'samples': 1818048, 'steps': 9468, 'loss/train': 1.6802074909210205} +11/06/2021 22:33:54 - INFO - __main__ - Step 9470: {'lr': 0.0004968645394343908, 'samples': 1818240, 'steps': 9469, 'loss/train': 1.5846213102340698} +11/06/2021 22:33:55 - INFO - __main__ - Step 9471: {'lr': 0.0004968637015450639, 'samples': 1818432, 'steps': 9470, 'loss/train': 1.8173738718032837} +11/06/2021 22:33:55 - INFO - __main__ - Step 9472: {'lr': 0.000496862863544504, 'samples': 1818624, 'steps': 9471, 'loss/train': 1.4764689207077026} +11/06/2021 22:33:56 - INFO - __main__ - Step 9473: {'lr': 0.0004968620254327114, 'samples': 1818816, 'steps': 9472, 'loss/train': 1.9476569890975952} +11/06/2021 22:33:56 - INFO - __main__ - Step 9474: {'lr': 0.0004968611872096868, 'samples': 1819008, 'steps': 9473, 'loss/train': 1.7643886804580688} +11/06/2021 22:33:57 - INFO - __main__ - Step 9475: {'lr': 0.0004968603488754302, 'samples': 1819200, 'steps': 9474, 'loss/train': 1.442833423614502} +11/06/2021 22:33:57 - INFO - __main__ - Step 9476: {'lr': 0.0004968595104299422, 'samples': 1819392, 'steps': 9475, 'loss/train': 2.2946574687957764} +11/06/2021 22:33:57 - INFO - __main__ - Step 9477: {'lr': 0.000496858671873223, 'samples': 1819584, 'steps': 9476, 'loss/train': 2.2401070594787598} +11/06/2021 22:33:58 - INFO - __main__ - Step 9478: {'lr': 0.0004968578332052733, 'samples': 1819776, 'steps': 9477, 'loss/train': 1.696811556816101} +11/06/2021 22:33:59 - INFO - __main__ - Step 9479: {'lr': 0.0004968569944260932, 'samples': 1819968, 'steps': 9478, 'loss/train': 2.2511560916900635} +11/06/2021 22:33:59 - INFO - __main__ - Step 9480: {'lr': 0.0004968561555356831, 'samples': 1820160, 'steps': 9479, 'loss/train': 1.6641721725463867} +11/06/2021 22:33:59 - INFO - __main__ - Step 9481: {'lr': 0.0004968553165340435, 'samples': 1820352, 'steps': 9480, 'loss/train': 1.7705086469650269} +11/06/2021 22:34:00 - INFO - __main__ - Step 9482: {'lr': 0.0004968544774211746, 'samples': 1820544, 'steps': 9481, 'loss/train': 1.7317209243774414} +11/06/2021 22:34:01 - INFO - __main__ - Step 9483: {'lr': 0.0004968536381970769, 'samples': 1820736, 'steps': 9482, 'loss/train': 1.7108385562896729} +11/06/2021 22:34:01 - INFO - __main__ - Step 9484: {'lr': 0.0004968527988617508, 'samples': 1820928, 'steps': 9483, 'loss/train': 1.9148114919662476} +11/06/2021 22:34:02 - INFO - __main__ - Step 9485: {'lr': 0.0004968519594151966, 'samples': 1821120, 'steps': 9484, 'loss/train': 2.120004653930664} +11/06/2021 22:34:02 - INFO - __main__ - Step 9486: {'lr': 0.0004968511198574147, 'samples': 1821312, 'steps': 9485, 'loss/train': 2.175170660018921} +11/06/2021 22:34:02 - INFO - __main__ - Step 9487: {'lr': 0.0004968502801884056, 'samples': 1821504, 'steps': 9486, 'loss/train': 1.964535117149353} +11/06/2021 22:34:03 - INFO - __main__ - Step 9488: {'lr': 0.0004968494404081695, 'samples': 1821696, 'steps': 9487, 'loss/train': 1.3058781623840332} +11/06/2021 22:34:04 - INFO - __main__ - Step 9489: {'lr': 0.0004968486005167069, 'samples': 1821888, 'steps': 9488, 'loss/train': 1.7480806112289429} +11/06/2021 22:34:04 - INFO - __main__ - Step 9490: {'lr': 0.000496847760514018, 'samples': 1822080, 'steps': 9489, 'loss/train': 1.46340012550354} +11/06/2021 22:34:04 - INFO - __main__ - Step 9491: {'lr': 0.0004968469204001035, 'samples': 1822272, 'steps': 9490, 'loss/train': 2.2288196086883545} +11/06/2021 22:34:05 - INFO - __main__ - Step 9492: {'lr': 0.0004968460801749635, 'samples': 1822464, 'steps': 9491, 'loss/train': 1.707292914390564} +11/06/2021 22:34:05 - INFO - __main__ - Step 9493: {'lr': 0.0004968452398385984, 'samples': 1822656, 'steps': 9492, 'loss/train': 1.734236240386963} +11/06/2021 22:34:06 - INFO - __main__ - Step 9494: {'lr': 0.0004968443993910086, 'samples': 1822848, 'steps': 9493, 'loss/train': 1.8103415966033936} +11/06/2021 22:34:07 - INFO - __main__ - Step 9495: {'lr': 0.0004968435588321947, 'samples': 1823040, 'steps': 9494, 'loss/train': 1.4598149061203003} +11/06/2021 22:34:07 - INFO - __main__ - Step 9496: {'lr': 0.0004968427181621567, 'samples': 1823232, 'steps': 9495, 'loss/train': 1.8984959125518799} +11/06/2021 22:34:07 - INFO - __main__ - Step 9497: {'lr': 0.0004968418773808954, 'samples': 1823424, 'steps': 9496, 'loss/train': 1.705300211906433} +11/06/2021 22:34:08 - INFO - __main__ - Step 9498: {'lr': 0.0004968410364884109, 'samples': 1823616, 'steps': 9497, 'loss/train': 1.6887762546539307} +11/06/2021 22:34:09 - INFO - __main__ - Step 9499: {'lr': 0.0004968401954847035, 'samples': 1823808, 'steps': 9498, 'loss/train': 1.4879417419433594} +11/06/2021 22:34:09 - INFO - __main__ - Step 9500: {'lr': 0.0004968393543697739, 'samples': 1824000, 'steps': 9499, 'loss/train': 1.49965238571167} +11/06/2021 22:34:09 - INFO - __main__ - Step 9501: {'lr': 0.0004968385131436222, 'samples': 1824192, 'steps': 9500, 'loss/train': 1.9283766746520996} +11/06/2021 22:34:10 - INFO - __main__ - Step 9502: {'lr': 0.0004968376718062488, 'samples': 1824384, 'steps': 9501, 'loss/train': 1.9032224416732788} +11/06/2021 22:34:10 - INFO - __main__ - Step 9503: {'lr': 0.0004968368303576542, 'samples': 1824576, 'steps': 9502, 'loss/train': 2.1025607585906982} +11/06/2021 22:34:11 - INFO - __main__ - Step 9504: {'lr': 0.0004968359887978389, 'samples': 1824768, 'steps': 9503, 'loss/train': 0.9440047144889832} +11/06/2021 22:34:11 - INFO - __main__ - Step 9505: {'lr': 0.0004968351471268029, 'samples': 1824960, 'steps': 9504, 'loss/train': 2.4170825481414795} +11/06/2021 22:34:12 - INFO - __main__ - Step 9506: {'lr': 0.0004968343053445469, 'samples': 1825152, 'steps': 9505, 'loss/train': 1.723289132118225} +11/06/2021 22:34:12 - INFO - __main__ - Step 9507: {'lr': 0.0004968334634510712, 'samples': 1825344, 'steps': 9506, 'loss/train': 2.1578383445739746} +11/06/2021 22:34:13 - INFO - __main__ - Step 9508: {'lr': 0.000496832621446376, 'samples': 1825536, 'steps': 9507, 'loss/train': 1.3967469930648804} +11/06/2021 22:34:13 - INFO - __main__ - Step 9509: {'lr': 0.000496831779330462, 'samples': 1825728, 'steps': 9508, 'loss/train': 1.5260154008865356} +11/06/2021 22:34:14 - INFO - __main__ - Step 9510: {'lr': 0.0004968309371033293, 'samples': 1825920, 'steps': 9509, 'loss/train': 1.9803547859191895} +11/06/2021 22:34:14 - INFO - __main__ - Step 9511: {'lr': 0.0004968300947649784, 'samples': 1826112, 'steps': 9510, 'loss/train': 1.811102271080017} +11/06/2021 22:34:15 - INFO - __main__ - Step 9512: {'lr': 0.0004968292523154096, 'samples': 1826304, 'steps': 9511, 'loss/train': 1.6655768156051636} +11/06/2021 22:34:15 - INFO - __main__ - Step 9513: {'lr': 0.0004968284097546235, 'samples': 1826496, 'steps': 9512, 'loss/train': 1.665718913078308} +11/06/2021 22:34:15 - INFO - __main__ - Step 9514: {'lr': 0.0004968275670826204, 'samples': 1826688, 'steps': 9513, 'loss/train': 1.7052531242370605} +11/06/2021 22:34:16 - INFO - __main__ - Step 9515: {'lr': 0.0004968267242994003, 'samples': 1826880, 'steps': 9514, 'loss/train': 1.3750792741775513} +11/06/2021 22:34:17 - INFO - __main__ - Step 9516: {'lr': 0.0004968258814049641, 'samples': 1827072, 'steps': 9515, 'loss/train': 1.3806614875793457} +11/06/2021 22:34:17 - INFO - __main__ - Step 9517: {'lr': 0.0004968250383993119, 'samples': 1827264, 'steps': 9516, 'loss/train': 2.3476414680480957} +11/06/2021 22:34:17 - INFO - __main__ - Step 9518: {'lr': 0.0004968241952824442, 'samples': 1827456, 'steps': 9517, 'loss/train': 1.6158838272094727} +11/06/2021 22:34:18 - INFO - __main__ - Step 9519: {'lr': 0.0004968233520543613, 'samples': 1827648, 'steps': 9518, 'loss/train': 2.4204187393188477} +11/06/2021 22:34:19 - INFO - __main__ - Step 9520: {'lr': 0.0004968225087150636, 'samples': 1827840, 'steps': 9519, 'loss/train': 1.876865267753601} +11/06/2021 22:34:19 - INFO - __main__ - Step 9521: {'lr': 0.0004968216652645515, 'samples': 1828032, 'steps': 9520, 'loss/train': 2.089869737625122} +11/06/2021 22:34:20 - INFO - __main__ - Step 9522: {'lr': 0.0004968208217028254, 'samples': 1828224, 'steps': 9521, 'loss/train': 1.1889524459838867} +11/06/2021 22:34:20 - INFO - __main__ - Step 9523: {'lr': 0.0004968199780298855, 'samples': 1828416, 'steps': 9522, 'loss/train': 1.8859481811523438} +11/06/2021 22:34:20 - INFO - __main__ - Step 9524: {'lr': 0.0004968191342457325, 'samples': 1828608, 'steps': 9523, 'loss/train': 1.6368975639343262} +11/06/2021 22:34:22 - INFO - __main__ - Step 9525: {'lr': 0.0004968182903503665, 'samples': 1828800, 'steps': 9524, 'loss/train': 1.5924121141433716} +11/06/2021 22:34:22 - INFO - __main__ - Step 9526: {'lr': 0.0004968174463437881, 'samples': 1828992, 'steps': 9525, 'loss/train': 1.3622881174087524} +11/06/2021 22:34:22 - INFO - __main__ - Step 9527: {'lr': 0.0004968166022259974, 'samples': 1829184, 'steps': 9526, 'loss/train': 1.6611684560775757} +11/06/2021 22:34:23 - INFO - __main__ - Step 9528: {'lr': 0.0004968157579969951, 'samples': 1829376, 'steps': 9527, 'loss/train': 1.8583652973175049} +11/06/2021 22:34:23 - INFO - __main__ - Step 9529: {'lr': 0.0004968149136567814, 'samples': 1829568, 'steps': 9528, 'loss/train': 1.5691323280334473} +11/06/2021 22:34:23 - INFO - __main__ - Step 9530: {'lr': 0.0004968140692053567, 'samples': 1829760, 'steps': 9529, 'loss/train': 1.7236870527267456} +11/06/2021 22:34:24 - INFO - __main__ - Step 9531: {'lr': 0.0004968132246427212, 'samples': 1829952, 'steps': 9530, 'loss/train': 2.275637149810791} +11/06/2021 22:34:25 - INFO - __main__ - Step 9532: {'lr': 0.0004968123799688757, 'samples': 1830144, 'steps': 9531, 'loss/train': 1.7203338146209717} +11/06/2021 22:34:25 - INFO - __main__ - Step 9533: {'lr': 0.0004968115351838203, 'samples': 1830336, 'steps': 9532, 'loss/train': 2.002017021179199} +11/06/2021 22:34:26 - INFO - __main__ - Step 9534: {'lr': 0.0004968106902875554, 'samples': 1830528, 'steps': 9533, 'loss/train': 1.5515137910842896} +11/06/2021 22:34:26 - INFO - __main__ - Step 9535: {'lr': 0.0004968098452800815, 'samples': 1830720, 'steps': 9534, 'loss/train': 1.9174106121063232} +11/06/2021 22:34:26 - INFO - __main__ - Step 9536: {'lr': 0.0004968090001613987, 'samples': 1830912, 'steps': 9535, 'loss/train': 1.4403159618377686} +11/06/2021 22:34:27 - INFO - __main__ - Step 9537: {'lr': 0.0004968081549315078, 'samples': 1831104, 'steps': 9536, 'loss/train': 1.640446662902832} +11/06/2021 22:34:28 - INFO - __main__ - Step 9538: {'lr': 0.0004968073095904088, 'samples': 1831296, 'steps': 9537, 'loss/train': 1.7125294208526611} +11/06/2021 22:34:28 - INFO - __main__ - Step 9539: {'lr': 0.0004968064641381022, 'samples': 1831488, 'steps': 9538, 'loss/train': 2.010976552963257} +11/06/2021 22:34:28 - INFO - __main__ - Step 9540: {'lr': 0.0004968056185745886, 'samples': 1831680, 'steps': 9539, 'loss/train': 2.09594464302063} +11/06/2021 22:34:29 - INFO - __main__ - Step 9541: {'lr': 0.000496804772899868, 'samples': 1831872, 'steps': 9540, 'loss/train': 1.843455195426941} +11/06/2021 22:34:30 - INFO - __main__ - Step 9542: {'lr': 0.0004968039271139412, 'samples': 1832064, 'steps': 9541, 'loss/train': 2.009514331817627} +11/06/2021 22:34:30 - INFO - __main__ - Step 9543: {'lr': 0.0004968030812168082, 'samples': 1832256, 'steps': 9542, 'loss/train': 1.7577793598175049} +11/06/2021 22:34:30 - INFO - __main__ - Step 9544: {'lr': 0.0004968022352084695, 'samples': 1832448, 'steps': 9543, 'loss/train': 2.0828323364257812} +11/06/2021 22:34:31 - INFO - __main__ - Step 9545: {'lr': 0.0004968013890889256, 'samples': 1832640, 'steps': 9544, 'loss/train': 1.7458568811416626} +11/06/2021 22:34:31 - INFO - __main__ - Step 9546: {'lr': 0.0004968005428581767, 'samples': 1832832, 'steps': 9545, 'loss/train': 2.1240222454071045} +11/06/2021 22:34:32 - INFO - __main__ - Step 9547: {'lr': 0.0004967996965162235, 'samples': 1833024, 'steps': 9546, 'loss/train': 1.8390196561813354} +11/06/2021 22:34:32 - INFO - __main__ - Step 9548: {'lr': 0.0004967988500630661, 'samples': 1833216, 'steps': 9547, 'loss/train': 1.910079836845398} +11/06/2021 22:34:33 - INFO - __main__ - Step 9549: {'lr': 0.0004967980034987048, 'samples': 1833408, 'steps': 9548, 'loss/train': 2.003260374069214} +11/06/2021 22:34:33 - INFO - __main__ - Step 9550: {'lr': 0.0004967971568231402, 'samples': 1833600, 'steps': 9549, 'loss/train': 1.5235668420791626} +11/06/2021 22:34:33 - INFO - __main__ - Step 9551: {'lr': 0.0004967963100363726, 'samples': 1833792, 'steps': 9550, 'loss/train': 1.7840920686721802} +11/06/2021 22:34:35 - INFO - __main__ - Step 9552: {'lr': 0.0004967954631384025, 'samples': 1833984, 'steps': 9551, 'loss/train': 1.2505114078521729} +11/06/2021 22:34:35 - INFO - __main__ - Step 9553: {'lr': 0.00049679461612923, 'samples': 1834176, 'steps': 9552, 'loss/train': 1.4225518703460693} +11/06/2021 22:34:36 - INFO - __main__ - Step 9554: {'lr': 0.0004967937690088558, 'samples': 1834368, 'steps': 9553, 'loss/train': 2.004608154296875} +11/06/2021 22:34:36 - INFO - __main__ - Step 9555: {'lr': 0.0004967929217772801, 'samples': 1834560, 'steps': 9554, 'loss/train': 2.0895955562591553} +11/06/2021 22:34:36 - INFO - __main__ - Step 9556: {'lr': 0.0004967920744345033, 'samples': 1834752, 'steps': 9555, 'loss/train': 0.44858700037002563} +11/06/2021 22:34:37 - INFO - __main__ - Step 9557: {'lr': 0.0004967912269805257, 'samples': 1834944, 'steps': 9556, 'loss/train': 2.1345250606536865} +11/06/2021 22:34:38 - INFO - __main__ - Step 9558: {'lr': 0.000496790379415348, 'samples': 1835136, 'steps': 9557, 'loss/train': 1.6229137182235718} +11/06/2021 22:34:38 - INFO - __main__ - Step 9559: {'lr': 0.0004967895317389702, 'samples': 1835328, 'steps': 9558, 'loss/train': 1.6342477798461914} +11/06/2021 22:34:38 - INFO - __main__ - Step 9560: {'lr': 0.0004967886839513929, 'samples': 1835520, 'steps': 9559, 'loss/train': 1.9332375526428223} +11/06/2021 22:34:39 - INFO - __main__ - Step 9561: {'lr': 0.0004967878360526163, 'samples': 1835712, 'steps': 9560, 'loss/train': 1.733110785484314} +11/06/2021 22:34:39 - INFO - __main__ - Step 9562: {'lr': 0.0004967869880426411, 'samples': 1835904, 'steps': 9561, 'loss/train': 1.7204447984695435} +11/06/2021 22:34:40 - INFO - __main__ - Step 9563: {'lr': 0.0004967861399214674, 'samples': 1836096, 'steps': 9562, 'loss/train': 1.7751929759979248} +11/06/2021 22:34:40 - INFO - __main__ - Step 9564: {'lr': 0.0004967852916890958, 'samples': 1836288, 'steps': 9563, 'loss/train': 1.7982103824615479} +11/06/2021 22:34:41 - INFO - __main__ - Step 9565: {'lr': 0.0004967844433455263, 'samples': 1836480, 'steps': 9564, 'loss/train': 2.2210209369659424} +11/06/2021 22:34:41 - INFO - __main__ - Step 9566: {'lr': 0.0004967835948907598, 'samples': 1836672, 'steps': 9565, 'loss/train': 1.8117777109146118} +11/06/2021 22:34:41 - INFO - __main__ - Step 9567: {'lr': 0.0004967827463247962, 'samples': 1836864, 'steps': 9566, 'loss/train': 1.7700427770614624} +11/06/2021 22:34:42 - INFO - __main__ - Step 9568: {'lr': 0.0004967818976476363, 'samples': 1837056, 'steps': 9567, 'loss/train': 1.9625296592712402} +11/06/2021 22:34:43 - INFO - __main__ - Step 9569: {'lr': 0.0004967810488592801, 'samples': 1837248, 'steps': 9568, 'loss/train': 1.7147427797317505} +11/06/2021 22:34:43 - INFO - __main__ - Step 9570: {'lr': 0.0004967801999597283, 'samples': 1837440, 'steps': 9569, 'loss/train': 1.954040765762329} +11/06/2021 22:34:43 - INFO - __main__ - Step 9571: {'lr': 0.0004967793509489811, 'samples': 1837632, 'steps': 9570, 'loss/train': 2.0516250133514404} +11/06/2021 22:34:44 - INFO - __main__ - Step 9572: {'lr': 0.0004967785018270389, 'samples': 1837824, 'steps': 9571, 'loss/train': 1.2908155918121338} +11/06/2021 22:34:45 - INFO - __main__ - Step 9573: {'lr': 0.0004967776525939022, 'samples': 1838016, 'steps': 9572, 'loss/train': 1.586142897605896} +11/06/2021 22:34:45 - INFO - __main__ - Step 9574: {'lr': 0.0004967768032495712, 'samples': 1838208, 'steps': 9573, 'loss/train': 1.9211750030517578} +11/06/2021 22:34:46 - INFO - __main__ - Step 9575: {'lr': 0.0004967759537940464, 'samples': 1838400, 'steps': 9574, 'loss/train': 6.170900821685791} +11/06/2021 22:34:46 - INFO - __main__ - Step 9576: {'lr': 0.0004967751042273282, 'samples': 1838592, 'steps': 9575, 'loss/train': 2.606065273284912} +11/06/2021 22:34:46 - INFO - __main__ - Step 9577: {'lr': 0.000496774254549417, 'samples': 1838784, 'steps': 9576, 'loss/train': 1.8838642835617065} +11/06/2021 22:34:47 - INFO - __main__ - Step 9578: {'lr': 0.0004967734047603131, 'samples': 1838976, 'steps': 9577, 'loss/train': 1.8725879192352295} +11/06/2021 22:34:48 - INFO - __main__ - Step 9579: {'lr': 0.0004967725548600168, 'samples': 1839168, 'steps': 9578, 'loss/train': 1.7218821048736572} +11/06/2021 22:34:48 - INFO - __main__ - Step 9580: {'lr': 0.0004967717048485287, 'samples': 1839360, 'steps': 9579, 'loss/train': 2.031545400619507} +11/06/2021 22:34:48 - INFO - __main__ - Step 9581: {'lr': 0.000496770854725849, 'samples': 1839552, 'steps': 9580, 'loss/train': 1.9540653228759766} +11/06/2021 22:34:49 - INFO - __main__ - Step 9582: {'lr': 0.0004967700044919783, 'samples': 1839744, 'steps': 9581, 'loss/train': 2.139894485473633} +11/06/2021 22:34:49 - INFO - __main__ - Step 9583: {'lr': 0.0004967691541469167, 'samples': 1839936, 'steps': 9582, 'loss/train': 1.7633771896362305} +11/06/2021 22:34:50 - INFO - __main__ - Step 9584: {'lr': 0.0004967683036906648, 'samples': 1840128, 'steps': 9583, 'loss/train': 2.204907178878784} +11/06/2021 22:34:50 - INFO - __main__ - Step 9585: {'lr': 0.0004967674531232229, 'samples': 1840320, 'steps': 9584, 'loss/train': 1.9411033391952515} +11/06/2021 22:34:51 - INFO - __main__ - Step 9586: {'lr': 0.0004967666024445913, 'samples': 1840512, 'steps': 9585, 'loss/train': 1.1677578687667847} +11/06/2021 22:34:51 - INFO - __main__ - Step 9587: {'lr': 0.0004967657516547707, 'samples': 1840704, 'steps': 9586, 'loss/train': 1.5230824947357178} +11/06/2021 22:34:51 - INFO - __main__ - Step 9588: {'lr': 0.0004967649007537611, 'samples': 1840896, 'steps': 9587, 'loss/train': 1.3074101209640503} +11/06/2021 22:34:52 - INFO - __main__ - Step 9589: {'lr': 0.0004967640497415631, 'samples': 1841088, 'steps': 9588, 'loss/train': 2.527937412261963} +11/06/2021 22:34:53 - INFO - __main__ - Step 9590: {'lr': 0.000496763198618177, 'samples': 1841280, 'steps': 9589, 'loss/train': 2.1263439655303955} +11/06/2021 22:34:53 - INFO - __main__ - Step 9591: {'lr': 0.0004967623473836032, 'samples': 1841472, 'steps': 9590, 'loss/train': 1.8565070629119873} +11/06/2021 22:34:53 - INFO - __main__ - Step 9592: {'lr': 0.0004967614960378421, 'samples': 1841664, 'steps': 9591, 'loss/train': 2.0305135250091553} +11/06/2021 22:34:54 - INFO - __main__ - Step 9593: {'lr': 0.000496760644580894, 'samples': 1841856, 'steps': 9592, 'loss/train': 1.905313491821289} +11/06/2021 22:34:55 - INFO - __main__ - Step 9594: {'lr': 0.0004967597930127595, 'samples': 1842048, 'steps': 9593, 'loss/train': 2.1325924396514893} +11/06/2021 22:34:55 - INFO - __main__ - Step 9595: {'lr': 0.0004967589413334387, 'samples': 1842240, 'steps': 9594, 'loss/train': 1.6247498989105225} +11/06/2021 22:34:56 - INFO - __main__ - Step 9596: {'lr': 0.0004967580895429322, 'samples': 1842432, 'steps': 9595, 'loss/train': 1.7681033611297607} +11/06/2021 22:34:56 - INFO - __main__ - Step 9597: {'lr': 0.0004967572376412405, 'samples': 1842624, 'steps': 9596, 'loss/train': 1.8701852560043335} +11/06/2021 22:34:56 - INFO - __main__ - Step 9598: {'lr': 0.0004967563856283636, 'samples': 1842816, 'steps': 9597, 'loss/train': 1.6864864826202393} +11/06/2021 22:34:58 - INFO - __main__ - Step 9599: {'lr': 0.000496755533504302, 'samples': 1843008, 'steps': 9598, 'loss/train': 1.842852234840393} +11/06/2021 22:34:58 - INFO - __main__ - Step 9600: {'lr': 0.0004967546812690563, 'samples': 1843200, 'steps': 9599, 'loss/train': 1.65439772605896} +11/06/2021 22:34:58 - INFO - __main__ - Step 9601: {'lr': 0.0004967538289226267, 'samples': 1843392, 'steps': 9600, 'loss/train': 1.5017353296279907} +11/06/2021 22:34:59 - INFO - __main__ - Step 9602: {'lr': 0.0004967529764650137, 'samples': 1843584, 'steps': 9601, 'loss/train': 1.895011067390442} +11/06/2021 22:34:59 - INFO - __main__ - Step 9603: {'lr': 0.0004967521238962175, 'samples': 1843776, 'steps': 9602, 'loss/train': 1.7376617193222046} +11/06/2021 22:34:59 - INFO - __main__ - Step 9604: {'lr': 0.0004967512712162387, 'samples': 1843968, 'steps': 9603, 'loss/train': 1.7263696193695068} +11/06/2021 22:35:00 - INFO - __main__ - Step 9605: {'lr': 0.0004967504184250775, 'samples': 1844160, 'steps': 9604, 'loss/train': 2.917311906814575} +11/06/2021 22:35:01 - INFO - __main__ - Step 9606: {'lr': 0.0004967495655227344, 'samples': 1844352, 'steps': 9605, 'loss/train': 2.3843181133270264} +11/06/2021 22:35:01 - INFO - __main__ - Step 9607: {'lr': 0.0004967487125092098, 'samples': 1844544, 'steps': 9606, 'loss/train': 1.349475622177124} +11/06/2021 22:35:02 - INFO - __main__ - Step 9608: {'lr': 0.0004967478593845041, 'samples': 1844736, 'steps': 9607, 'loss/train': 1.40731942653656} +11/06/2021 22:35:02 - INFO - __main__ - Step 9609: {'lr': 0.0004967470061486175, 'samples': 1844928, 'steps': 9608, 'loss/train': 1.621782660484314} +11/06/2021 22:35:02 - INFO - __main__ - Step 9610: {'lr': 0.0004967461528015506, 'samples': 1845120, 'steps': 9609, 'loss/train': 1.7241379022598267} +11/06/2021 22:35:03 - INFO - __main__ - Step 9611: {'lr': 0.0004967452993433036, 'samples': 1845312, 'steps': 9610, 'loss/train': 1.7397297620773315} +11/06/2021 22:35:04 - INFO - __main__ - Step 9612: {'lr': 0.0004967444457738769, 'samples': 1845504, 'steps': 9611, 'loss/train': 1.5325270891189575} +11/06/2021 22:35:04 - INFO - __main__ - Step 9613: {'lr': 0.0004967435920932711, 'samples': 1845696, 'steps': 9612, 'loss/train': 1.8796131610870361} +11/06/2021 22:35:04 - INFO - __main__ - Step 9614: {'lr': 0.0004967427383014865, 'samples': 1845888, 'steps': 9613, 'loss/train': 2.0587081909179688} +11/06/2021 22:35:05 - INFO - __main__ - Step 9615: {'lr': 0.0004967418843985233, 'samples': 1846080, 'steps': 9614, 'loss/train': 1.6247023344039917} +11/06/2021 22:35:06 - INFO - __main__ - Step 9616: {'lr': 0.0004967410303843821, 'samples': 1846272, 'steps': 9615, 'loss/train': 2.14107346534729} +11/06/2021 22:35:06 - INFO - __main__ - Step 9617: {'lr': 0.0004967401762590631, 'samples': 1846464, 'steps': 9616, 'loss/train': 1.674919605255127} +11/06/2021 22:35:06 - INFO - __main__ - Step 9618: {'lr': 0.0004967393220225668, 'samples': 1846656, 'steps': 9617, 'loss/train': 1.9346179962158203} +11/06/2021 22:35:07 - INFO - __main__ - Step 9619: {'lr': 0.0004967384676748936, 'samples': 1846848, 'steps': 9618, 'loss/train': 1.5423815250396729} +11/06/2021 22:35:07 - INFO - __main__ - Step 9620: {'lr': 0.0004967376132160438, 'samples': 1847040, 'steps': 9619, 'loss/train': 2.3580563068389893} +11/06/2021 22:35:08 - INFO - __main__ - Step 9621: {'lr': 0.000496736758646018, 'samples': 1847232, 'steps': 9620, 'loss/train': 1.7103986740112305} +11/06/2021 22:35:09 - INFO - __main__ - Step 9622: {'lr': 0.0004967359039648163, 'samples': 1847424, 'steps': 9621, 'loss/train': 1.5623164176940918} +11/06/2021 22:35:09 - INFO - __main__ - Step 9623: {'lr': 0.0004967350491724392, 'samples': 1847616, 'steps': 9622, 'loss/train': 1.5282793045043945} +11/06/2021 22:35:09 - INFO - __main__ - Step 9624: {'lr': 0.0004967341942688872, 'samples': 1847808, 'steps': 9623, 'loss/train': 1.75148344039917} +11/06/2021 22:35:10 - INFO - __main__ - Step 9625: {'lr': 0.0004967333392541604, 'samples': 1848000, 'steps': 9624, 'loss/train': 1.2734038829803467} +11/06/2021 22:35:11 - INFO - __main__ - Step 9626: {'lr': 0.0004967324841282596, 'samples': 1848192, 'steps': 9625, 'loss/train': 1.7880160808563232} +11/06/2021 22:35:11 - INFO - __main__ - Step 9627: {'lr': 0.0004967316288911847, 'samples': 1848384, 'steps': 9626, 'loss/train': 1.675197958946228} +11/06/2021 22:35:11 - INFO - __main__ - Step 9628: {'lr': 0.0004967307735429365, 'samples': 1848576, 'steps': 9627, 'loss/train': 2.0006182193756104} +11/06/2021 22:35:12 - INFO - __main__ - Step 9629: {'lr': 0.0004967299180835153, 'samples': 1848768, 'steps': 9628, 'loss/train': 1.4124494791030884} +11/06/2021 22:35:12 - INFO - __main__ - Step 9630: {'lr': 0.0004967290625129212, 'samples': 1848960, 'steps': 9629, 'loss/train': 1.5025792121887207} +11/06/2021 22:35:12 - INFO - __main__ - Step 9631: {'lr': 0.0004967282068311548, 'samples': 1849152, 'steps': 9630, 'loss/train': 2.0721802711486816} +11/06/2021 22:35:14 - INFO - __main__ - Step 9632: {'lr': 0.0004967273510382166, 'samples': 1849344, 'steps': 9631, 'loss/train': 1.781577229499817} +11/06/2021 22:35:14 - INFO - __main__ - Step 9633: {'lr': 0.0004967264951341069, 'samples': 1849536, 'steps': 9632, 'loss/train': 1.7446000576019287} +11/06/2021 22:35:14 - INFO - __main__ - Step 9634: {'lr': 0.0004967256391188258, 'samples': 1849728, 'steps': 9633, 'loss/train': 1.9075095653533936} +11/06/2021 22:35:15 - INFO - __main__ - Step 9635: {'lr': 0.0004967247829923742, 'samples': 1849920, 'steps': 9634, 'loss/train': 2.3468635082244873} +11/06/2021 22:35:15 - INFO - __main__ - Step 9636: {'lr': 0.0004967239267547521, 'samples': 1850112, 'steps': 9635, 'loss/train': 1.420114278793335} +11/06/2021 22:35:16 - INFO - __main__ - Step 9637: {'lr': 0.00049672307040596, 'samples': 1850304, 'steps': 9636, 'loss/train': 1.8249211311340332} +11/06/2021 22:35:17 - INFO - __main__ - Step 9638: {'lr': 0.0004967222139459983, 'samples': 1850496, 'steps': 9637, 'loss/train': 0.8801685571670532} +11/06/2021 22:35:17 - INFO - __main__ - Step 9639: {'lr': 0.0004967213573748674, 'samples': 1850688, 'steps': 9638, 'loss/train': 1.8244924545288086} +11/06/2021 22:35:17 - INFO - __main__ - Step 9640: {'lr': 0.0004967205006925677, 'samples': 1850880, 'steps': 9639, 'loss/train': 1.8652440309524536} +11/06/2021 22:35:18 - INFO - __main__ - Step 9641: {'lr': 0.0004967196438990995, 'samples': 1851072, 'steps': 9640, 'loss/train': 1.3965966701507568} +11/06/2021 22:35:18 - INFO - __main__ - Step 9642: {'lr': 0.0004967187869944632, 'samples': 1851264, 'steps': 9641, 'loss/train': 2.0054564476013184} +11/06/2021 22:35:19 - INFO - __main__ - Step 9643: {'lr': 0.0004967179299786593, 'samples': 1851456, 'steps': 9642, 'loss/train': 0.7685950994491577} +11/06/2021 22:35:19 - INFO - __main__ - Step 9644: {'lr': 0.000496717072851688, 'samples': 1851648, 'steps': 9643, 'loss/train': 1.9576327800750732} +11/06/2021 22:35:20 - INFO - __main__ - Step 9645: {'lr': 0.0004967162156135499, 'samples': 1851840, 'steps': 9644, 'loss/train': 1.0496654510498047} +11/06/2021 22:35:20 - INFO - __main__ - Step 9646: {'lr': 0.0004967153582642452, 'samples': 1852032, 'steps': 9645, 'loss/train': 5.934883117675781} +11/06/2021 22:35:21 - INFO - __main__ - Step 9647: {'lr': 0.0004967145008037744, 'samples': 1852224, 'steps': 9646, 'loss/train': 1.2428544759750366} +11/06/2021 22:35:21 - INFO - __main__ - Step 9648: {'lr': 0.000496713643232138, 'samples': 1852416, 'steps': 9647, 'loss/train': 1.7407283782958984} +11/06/2021 22:35:22 - INFO - __main__ - Step 9649: {'lr': 0.000496712785549336, 'samples': 1852608, 'steps': 9648, 'loss/train': 1.9216516017913818} +11/06/2021 22:35:22 - INFO - __main__ - Step 9650: {'lr': 0.0004967119277553692, 'samples': 1852800, 'steps': 9649, 'loss/train': 1.5039646625518799} +11/06/2021 22:35:23 - INFO - __main__ - Step 9651: {'lr': 0.0004967110698502377, 'samples': 1852992, 'steps': 9650, 'loss/train': 1.7824867963790894} +11/06/2021 22:35:23 - INFO - __main__ - Step 9652: {'lr': 0.000496710211833942, 'samples': 1853184, 'steps': 9651, 'loss/train': 1.6737051010131836} +11/06/2021 22:35:24 - INFO - __main__ - Step 9653: {'lr': 0.0004967093537064825, 'samples': 1853376, 'steps': 9652, 'loss/train': 2.1513617038726807} +11/06/2021 22:35:24 - INFO - __main__ - Step 9654: {'lr': 0.0004967084954678597, 'samples': 1853568, 'steps': 9653, 'loss/train': 2.3092923164367676} +11/06/2021 22:35:25 - INFO - __main__ - Step 9655: {'lr': 0.0004967076371180738, 'samples': 1853760, 'steps': 9654, 'loss/train': 1.796209454536438} +11/06/2021 22:35:25 - INFO - __main__ - Step 9656: {'lr': 0.0004967067786571251, 'samples': 1853952, 'steps': 9655, 'loss/train': 1.7951509952545166} +11/06/2021 22:35:25 - INFO - __main__ - Step 9657: {'lr': 0.0004967059200850142, 'samples': 1854144, 'steps': 9656, 'loss/train': 1.7078092098236084} +11/06/2021 22:35:26 - INFO - __main__ - Step 9658: {'lr': 0.0004967050614017415, 'samples': 1854336, 'steps': 9657, 'loss/train': 2.276421546936035} +11/06/2021 22:35:27 - INFO - __main__ - Step 9659: {'lr': 0.0004967042026073073, 'samples': 1854528, 'steps': 9658, 'loss/train': 2.434033155441284} +11/06/2021 22:35:27 - INFO - __main__ - Step 9660: {'lr': 0.000496703343701712, 'samples': 1854720, 'steps': 9659, 'loss/train': 2.1363980770111084} +11/06/2021 22:35:28 - INFO - __main__ - Step 9661: {'lr': 0.0004967024846849558, 'samples': 1854912, 'steps': 9660, 'loss/train': 1.4073458909988403} +11/06/2021 22:35:28 - INFO - __main__ - Step 9662: {'lr': 0.0004967016255570394, 'samples': 1855104, 'steps': 9661, 'loss/train': 1.8968331813812256} +11/06/2021 22:35:28 - INFO - __main__ - Step 9663: {'lr': 0.0004967007663179632, 'samples': 1855296, 'steps': 9662, 'loss/train': 1.9019638299942017} +11/06/2021 22:35:29 - INFO - __main__ - Step 9664: {'lr': 0.0004966999069677272, 'samples': 1855488, 'steps': 9663, 'loss/train': 1.987317681312561} +11/06/2021 22:35:30 - INFO - __main__ - Step 9665: {'lr': 0.0004966990475063321, 'samples': 1855680, 'steps': 9664, 'loss/train': 1.3810869455337524} +11/06/2021 22:35:30 - INFO - __main__ - Step 9666: {'lr': 0.0004966981879337783, 'samples': 1855872, 'steps': 9665, 'loss/train': 1.1948487758636475} +11/06/2021 22:35:30 - INFO - __main__ - Step 9667: {'lr': 0.0004966973282500661, 'samples': 1856064, 'steps': 9666, 'loss/train': 1.8805911540985107} +11/06/2021 22:35:31 - INFO - __main__ - Step 9668: {'lr': 0.0004966964684551958, 'samples': 1856256, 'steps': 9667, 'loss/train': 1.9904563426971436} +11/06/2021 22:35:32 - INFO - __main__ - Step 9669: {'lr': 0.0004966956085491679, 'samples': 1856448, 'steps': 9668, 'loss/train': 1.7589201927185059} +11/06/2021 22:35:32 - INFO - __main__ - Step 9670: {'lr': 0.0004966947485319828, 'samples': 1856640, 'steps': 9669, 'loss/train': 2.156191825866699} +11/06/2021 22:35:32 - INFO - __main__ - Step 9671: {'lr': 0.0004966938884036408, 'samples': 1856832, 'steps': 9670, 'loss/train': 1.8533520698547363} +11/06/2021 22:35:33 - INFO - __main__ - Step 9672: {'lr': 0.0004966930281641423, 'samples': 1857024, 'steps': 9671, 'loss/train': 2.1764333248138428} +11/06/2021 22:35:33 - INFO - __main__ - Step 9673: {'lr': 0.0004966921678134879, 'samples': 1857216, 'steps': 9672, 'loss/train': 2.0473735332489014} +11/06/2021 22:35:34 - INFO - __main__ - Step 9674: {'lr': 0.0004966913073516777, 'samples': 1857408, 'steps': 9673, 'loss/train': 2.0089006423950195} +11/06/2021 22:35:35 - INFO - __main__ - Step 9675: {'lr': 0.0004966904467787123, 'samples': 1857600, 'steps': 9674, 'loss/train': 1.5391348600387573} +11/06/2021 22:35:35 - INFO - __main__ - Step 9676: {'lr': 0.0004966895860945918, 'samples': 1857792, 'steps': 9675, 'loss/train': 0.35723814368247986} +11/06/2021 22:35:35 - INFO - __main__ - Step 9677: {'lr': 0.0004966887252993169, 'samples': 1857984, 'steps': 9676, 'loss/train': 1.9116827249526978} +11/06/2021 22:35:36 - INFO - __main__ - Step 9678: {'lr': 0.0004966878643928879, 'samples': 1858176, 'steps': 9677, 'loss/train': 2.0364251136779785} +11/06/2021 22:35:37 - INFO - __main__ - Step 9679: {'lr': 0.0004966870033753051, 'samples': 1858368, 'steps': 9678, 'loss/train': 2.400313138961792} +11/06/2021 22:35:37 - INFO - __main__ - Step 9680: {'lr': 0.0004966861422465689, 'samples': 1858560, 'steps': 9679, 'loss/train': 1.7770127058029175} +11/06/2021 22:35:37 - INFO - __main__ - Step 9681: {'lr': 0.0004966852810066798, 'samples': 1858752, 'steps': 9680, 'loss/train': 1.5626760721206665} +11/06/2021 22:35:38 - INFO - __main__ - Step 9682: {'lr': 0.0004966844196556382, 'samples': 1858944, 'steps': 9681, 'loss/train': 1.113672137260437} +11/06/2021 22:35:38 - INFO - __main__ - Step 9683: {'lr': 0.0004966835581934442, 'samples': 1859136, 'steps': 9682, 'loss/train': 1.9191310405731201} +11/06/2021 22:35:39 - INFO - __main__ - Step 9684: {'lr': 0.0004966826966200985, 'samples': 1859328, 'steps': 9683, 'loss/train': 1.801482915878296} +11/06/2021 22:35:40 - INFO - __main__ - Step 9685: {'lr': 0.0004966818349356015, 'samples': 1859520, 'steps': 9684, 'loss/train': 2.271620273590088} +11/06/2021 22:35:40 - INFO - __main__ - Step 9686: {'lr': 0.0004966809731399533, 'samples': 1859712, 'steps': 9685, 'loss/train': 1.5356147289276123} +11/06/2021 22:35:40 - INFO - __main__ - Step 9687: {'lr': 0.0004966801112331545, 'samples': 1859904, 'steps': 9686, 'loss/train': 1.8079742193222046} +11/06/2021 22:35:41 - INFO - __main__ - Step 9688: {'lr': 0.0004966792492152054, 'samples': 1860096, 'steps': 9687, 'loss/train': 1.7540109157562256} +11/06/2021 22:35:41 - INFO - __main__ - Step 9689: {'lr': 0.0004966783870861066, 'samples': 1860288, 'steps': 9688, 'loss/train': 1.8654999732971191} +11/06/2021 22:35:42 - INFO - __main__ - Step 9690: {'lr': 0.0004966775248458582, 'samples': 1860480, 'steps': 9689, 'loss/train': 1.8638839721679688} +11/06/2021 22:35:42 - INFO - __main__ - Step 9691: {'lr': 0.0004966766624944607, 'samples': 1860672, 'steps': 9690, 'loss/train': 1.839411735534668} +11/06/2021 22:35:43 - INFO - __main__ - Step 9692: {'lr': 0.0004966758000319147, 'samples': 1860864, 'steps': 9691, 'loss/train': 1.5078877210617065} +11/06/2021 22:35:43 - INFO - __main__ - Step 9693: {'lr': 0.0004966749374582202, 'samples': 1861056, 'steps': 9692, 'loss/train': 2.1486093997955322} +11/06/2021 22:35:43 - INFO - __main__ - Step 9694: {'lr': 0.0004966740747733778, 'samples': 1861248, 'steps': 9693, 'loss/train': 2.061601161956787} +11/06/2021 22:35:44 - INFO - __main__ - Step 9695: {'lr': 0.0004966732119773879, 'samples': 1861440, 'steps': 9694, 'loss/train': 1.997467279434204} +11/06/2021 22:35:45 - INFO - __main__ - Step 9696: {'lr': 0.0004966723490702509, 'samples': 1861632, 'steps': 9695, 'loss/train': 1.515207052230835} +11/06/2021 22:35:45 - INFO - __main__ - Step 9697: {'lr': 0.000496671486051967, 'samples': 1861824, 'steps': 9696, 'loss/train': 1.542418122291565} +11/06/2021 22:35:45 - INFO - __main__ - Step 9698: {'lr': 0.0004966706229225368, 'samples': 1862016, 'steps': 9697, 'loss/train': 1.7097152471542358} +11/06/2021 22:35:46 - INFO - __main__ - Step 9699: {'lr': 0.0004966697596819607, 'samples': 1862208, 'steps': 9698, 'loss/train': 1.9859890937805176} +11/06/2021 22:35:47 - INFO - __main__ - Step 9700: {'lr': 0.0004966688963302389, 'samples': 1862400, 'steps': 9699, 'loss/train': 1.6902731657028198} +11/06/2021 22:35:47 - INFO - __main__ - Step 9701: {'lr': 0.000496668032867372, 'samples': 1862592, 'steps': 9700, 'loss/train': 2.2249433994293213} +11/06/2021 22:35:48 - INFO - __main__ - Step 9702: {'lr': 0.0004966671692933603, 'samples': 1862784, 'steps': 9701, 'loss/train': 2.1209845542907715} +11/06/2021 22:35:48 - INFO - __main__ - Step 9703: {'lr': 0.0004966663056082041, 'samples': 1862976, 'steps': 9702, 'loss/train': 2.0231058597564697} +11/06/2021 22:35:48 - INFO - __main__ - Step 9704: {'lr': 0.0004966654418119039, 'samples': 1863168, 'steps': 9703, 'loss/train': 1.7849528789520264} +11/06/2021 22:35:49 - INFO - __main__ - Step 9705: {'lr': 0.00049666457790446, 'samples': 1863360, 'steps': 9704, 'loss/train': 1.677087664604187} +11/06/2021 22:35:49 - INFO - __main__ - Step 9706: {'lr': 0.000496663713885873, 'samples': 1863552, 'steps': 9705, 'loss/train': 1.6094074249267578} +11/06/2021 22:35:50 - INFO - __main__ - Step 9707: {'lr': 0.0004966628497561431, 'samples': 1863744, 'steps': 9706, 'loss/train': 1.4655191898345947} +11/06/2021 22:35:50 - INFO - __main__ - Step 9708: {'lr': 0.0004966619855152706, 'samples': 1863936, 'steps': 9707, 'loss/train': 1.6858545541763306} +11/06/2021 22:35:51 - INFO - __main__ - Step 9709: {'lr': 0.0004966611211632561, 'samples': 1864128, 'steps': 9708, 'loss/train': 2.7526583671569824} +11/06/2021 22:35:51 - INFO - __main__ - Step 9710: {'lr': 0.0004966602567000999, 'samples': 1864320, 'steps': 9709, 'loss/train': 1.8276556730270386} +11/06/2021 22:35:52 - INFO - __main__ - Step 9711: {'lr': 0.0004966593921258023, 'samples': 1864512, 'steps': 9710, 'loss/train': 2.059382677078247} +11/06/2021 22:35:52 - INFO - __main__ - Step 9712: {'lr': 0.000496658527440364, 'samples': 1864704, 'steps': 9711, 'loss/train': 1.3967629671096802} +11/06/2021 22:35:53 - INFO - __main__ - Step 9713: {'lr': 0.000496657662643785, 'samples': 1864896, 'steps': 9712, 'loss/train': 1.2711286544799805} +11/06/2021 22:35:53 - INFO - __main__ - Step 9714: {'lr': 0.000496656797736066, 'samples': 1865088, 'steps': 9713, 'loss/train': 1.6706697940826416} +11/06/2021 22:35:53 - INFO - __main__ - Step 9715: {'lr': 0.0004966559327172071, 'samples': 1865280, 'steps': 9714, 'loss/train': 1.8991764783859253} +11/06/2021 22:35:54 - INFO - __main__ - Step 9716: {'lr': 0.0004966550675872089, 'samples': 1865472, 'steps': 9715, 'loss/train': 0.8012776970863342} +11/06/2021 22:35:55 - INFO - __main__ - Step 9717: {'lr': 0.0004966542023460718, 'samples': 1865664, 'steps': 9716, 'loss/train': 1.5615832805633545} +11/06/2021 22:35:55 - INFO - __main__ - Step 9718: {'lr': 0.000496653336993796, 'samples': 1865856, 'steps': 9717, 'loss/train': 1.8252805471420288} +11/06/2021 22:35:55 - INFO - __main__ - Step 9719: {'lr': 0.0004966524715303821, 'samples': 1866048, 'steps': 9718, 'loss/train': 1.7340925931930542} +11/06/2021 22:35:56 - INFO - __main__ - Step 9720: {'lr': 0.0004966516059558304, 'samples': 1866240, 'steps': 9719, 'loss/train': 1.9591999053955078} +11/06/2021 22:35:57 - INFO - __main__ - Step 9721: {'lr': 0.0004966507402701413, 'samples': 1866432, 'steps': 9720, 'loss/train': 1.574877142906189} +11/06/2021 22:35:57 - INFO - __main__ - Step 9722: {'lr': 0.0004966498744733151, 'samples': 1866624, 'steps': 9721, 'loss/train': 1.7162398099899292} +11/06/2021 22:35:58 - INFO - __main__ - Step 9723: {'lr': 0.0004966490085653523, 'samples': 1866816, 'steps': 9722, 'loss/train': 1.3233344554901123} +11/06/2021 22:35:58 - INFO - __main__ - Step 9724: {'lr': 0.0004966481425462533, 'samples': 1867008, 'steps': 9723, 'loss/train': 2.0228872299194336} +11/06/2021 22:35:58 - INFO - __main__ - Step 9725: {'lr': 0.0004966472764160183, 'samples': 1867200, 'steps': 9724, 'loss/train': 2.029508590698242} +11/06/2021 22:35:59 - INFO - __main__ - Step 9726: {'lr': 0.000496646410174648, 'samples': 1867392, 'steps': 9725, 'loss/train': 2.0226128101348877} +11/06/2021 22:36:00 - INFO - __main__ - Step 9727: {'lr': 0.0004966455438221427, 'samples': 1867584, 'steps': 9726, 'loss/train': 1.7145023345947266} +11/06/2021 22:36:00 - INFO - __main__ - Step 9728: {'lr': 0.0004966446773585026, 'samples': 1867776, 'steps': 9727, 'loss/train': 1.7100311517715454} +11/06/2021 22:36:00 - INFO - __main__ - Step 9729: {'lr': 0.0004966438107837283, 'samples': 1867968, 'steps': 9728, 'loss/train': 1.7535374164581299} +11/06/2021 22:36:01 - INFO - __main__ - Step 9730: {'lr': 0.00049664294409782, 'samples': 1868160, 'steps': 9729, 'loss/train': 1.442859172821045} +11/06/2021 22:36:01 - INFO - __main__ - Step 9731: {'lr': 0.0004966420773007782, 'samples': 1868352, 'steps': 9730, 'loss/train': 1.5532867908477783} +11/06/2021 22:36:02 - INFO - __main__ - Step 9732: {'lr': 0.0004966412103926034, 'samples': 1868544, 'steps': 9731, 'loss/train': 1.9052324295043945} +11/06/2021 22:36:02 - INFO - __main__ - Step 9733: {'lr': 0.0004966403433732958, 'samples': 1868736, 'steps': 9732, 'loss/train': 1.7569751739501953} +11/06/2021 22:36:03 - INFO - __main__ - Step 9734: {'lr': 0.0004966394762428559, 'samples': 1868928, 'steps': 9733, 'loss/train': 1.3910471200942993} +11/06/2021 22:36:03 - INFO - __main__ - Step 9735: {'lr': 0.0004966386090012841, 'samples': 1869120, 'steps': 9734, 'loss/train': 1.8945108652114868} +11/06/2021 22:36:03 - INFO - __main__ - Step 9736: {'lr': 0.0004966377416485806, 'samples': 1869312, 'steps': 9735, 'loss/train': 2.4226298332214355} +11/06/2021 22:36:05 - INFO - __main__ - Step 9737: {'lr': 0.0004966368741847461, 'samples': 1869504, 'steps': 9736, 'loss/train': 1.5357730388641357} +11/06/2021 22:36:05 - INFO - __main__ - Step 9738: {'lr': 0.0004966360066097807, 'samples': 1869696, 'steps': 9737, 'loss/train': 1.4675438404083252} +11/06/2021 22:36:05 - INFO - __main__ - Step 9739: {'lr': 0.0004966351389236851, 'samples': 1869888, 'steps': 9738, 'loss/train': 1.7604131698608398} +11/06/2021 22:36:06 - INFO - __main__ - Step 9740: {'lr': 0.0004966342711264593, 'samples': 1870080, 'steps': 9739, 'loss/train': 2.1939752101898193} +11/06/2021 22:36:06 - INFO - __main__ - Step 9741: {'lr': 0.000496633403218104, 'samples': 1870272, 'steps': 9740, 'loss/train': 1.855295181274414} +11/06/2021 22:36:07 - INFO - __main__ - Step 9742: {'lr': 0.0004966325351986195, 'samples': 1870464, 'steps': 9741, 'loss/train': 2.2889838218688965} +11/06/2021 22:36:07 - INFO - __main__ - Step 9743: {'lr': 0.0004966316670680062, 'samples': 1870656, 'steps': 9742, 'loss/train': 1.9611015319824219} +11/06/2021 22:36:08 - INFO - __main__ - Step 9744: {'lr': 0.0004966307988262644, 'samples': 1870848, 'steps': 9743, 'loss/train': 1.9820667505264282} +11/06/2021 22:36:08 - INFO - __main__ - Step 9745: {'lr': 0.0004966299304733947, 'samples': 1871040, 'steps': 9744, 'loss/train': 1.8761732578277588} +11/06/2021 22:36:08 - INFO - __main__ - Step 9746: {'lr': 0.0004966290620093972, 'samples': 1871232, 'steps': 9745, 'loss/train': 1.9568790197372437} +11/06/2021 22:36:09 - INFO - __main__ - Step 9747: {'lr': 0.0004966281934342725, 'samples': 1871424, 'steps': 9746, 'loss/train': 1.7533879280090332} +11/06/2021 22:36:10 - INFO - __main__ - Step 9748: {'lr': 0.000496627324748021, 'samples': 1871616, 'steps': 9747, 'loss/train': 2.03949236869812} +11/06/2021 22:36:10 - INFO - __main__ - Step 9749: {'lr': 0.000496626455950643, 'samples': 1871808, 'steps': 9748, 'loss/train': 2.50878643989563} +11/06/2021 22:36:10 - INFO - __main__ - Step 9750: {'lr': 0.000496625587042139, 'samples': 1872000, 'steps': 9749, 'loss/train': 1.5603324174880981} +11/06/2021 22:36:11 - INFO - __main__ - Step 9751: {'lr': 0.0004966247180225092, 'samples': 1872192, 'steps': 9750, 'loss/train': 1.700454592704773} +11/06/2021 22:36:11 - INFO - __main__ - Step 9752: {'lr': 0.0004966238488917542, 'samples': 1872384, 'steps': 9751, 'loss/train': 0.7267507910728455} +11/06/2021 22:36:12 - INFO - __main__ - Step 9753: {'lr': 0.0004966229796498742, 'samples': 1872576, 'steps': 9752, 'loss/train': 1.431842565536499} +11/06/2021 22:36:13 - INFO - __main__ - Step 9754: {'lr': 0.0004966221102968698, 'samples': 1872768, 'steps': 9753, 'loss/train': 1.7751144170761108} +11/06/2021 22:36:13 - INFO - __main__ - Step 9755: {'lr': 0.0004966212408327412, 'samples': 1872960, 'steps': 9754, 'loss/train': 1.7627856731414795} +11/06/2021 22:36:13 - INFO - __main__ - Step 9756: {'lr': 0.0004966203712574889, 'samples': 1873152, 'steps': 9755, 'loss/train': 2.068781852722168} +11/06/2021 22:36:14 - INFO - __main__ - Step 9757: {'lr': 0.0004966195015711132, 'samples': 1873344, 'steps': 9756, 'loss/train': 1.8314954042434692} +11/06/2021 22:36:15 - INFO - __main__ - Step 9758: {'lr': 0.0004966186317736146, 'samples': 1873536, 'steps': 9757, 'loss/train': 1.5385262966156006} +11/06/2021 22:36:15 - INFO - __main__ - Step 9759: {'lr': 0.0004966177618649935, 'samples': 1873728, 'steps': 9758, 'loss/train': 2.23832106590271} +11/06/2021 22:36:15 - INFO - __main__ - Step 9760: {'lr': 0.0004966168918452503, 'samples': 1873920, 'steps': 9759, 'loss/train': 2.2789201736450195} +11/06/2021 22:36:16 - INFO - __main__ - Step 9761: {'lr': 0.0004966160217143852, 'samples': 1874112, 'steps': 9760, 'loss/train': 1.4507635831832886} +11/06/2021 22:36:16 - INFO - __main__ - Step 9762: {'lr': 0.0004966151514723988, 'samples': 1874304, 'steps': 9761, 'loss/train': 1.7444387674331665} +11/06/2021 22:36:17 - INFO - __main__ - Step 9763: {'lr': 0.0004966142811192914, 'samples': 1874496, 'steps': 9762, 'loss/train': 2.5484769344329834} +11/06/2021 22:36:17 - INFO - __main__ - Step 9764: {'lr': 0.0004966134106550634, 'samples': 1874688, 'steps': 9763, 'loss/train': 2.3604612350463867} +11/06/2021 22:36:18 - INFO - __main__ - Step 9765: {'lr': 0.0004966125400797152, 'samples': 1874880, 'steps': 9764, 'loss/train': 1.8499844074249268} +11/06/2021 22:36:18 - INFO - __main__ - Step 9766: {'lr': 0.0004966116693932472, 'samples': 1875072, 'steps': 9765, 'loss/train': 2.1143555641174316} +11/06/2021 22:36:18 - INFO - __main__ - Step 9767: {'lr': 0.0004966107985956598, 'samples': 1875264, 'steps': 9766, 'loss/train': 1.2633049488067627} +11/06/2021 22:36:19 - INFO - __main__ - Step 9768: {'lr': 0.0004966099276869534, 'samples': 1875456, 'steps': 9767, 'loss/train': 1.519136667251587} +11/06/2021 22:36:20 - INFO - __main__ - Step 9769: {'lr': 0.0004966090566671283, 'samples': 1875648, 'steps': 9768, 'loss/train': 1.8271578550338745} +11/06/2021 22:36:20 - INFO - __main__ - Step 9770: {'lr': 0.000496608185536185, 'samples': 1875840, 'steps': 9769, 'loss/train': 1.837522268295288} +11/06/2021 22:36:20 - INFO - __main__ - Step 9771: {'lr': 0.0004966073142941239, 'samples': 1876032, 'steps': 9770, 'loss/train': 2.2010583877563477} +11/06/2021 22:36:21 - INFO - __main__ - Step 9772: {'lr': 0.0004966064429409452, 'samples': 1876224, 'steps': 9771, 'loss/train': 1.9248576164245605} +11/06/2021 22:36:22 - INFO - __main__ - Step 9773: {'lr': 0.0004966055714766496, 'samples': 1876416, 'steps': 9772, 'loss/train': 2.22214412689209} +11/06/2021 22:36:22 - INFO - __main__ - Step 9774: {'lr': 0.0004966046999012373, 'samples': 1876608, 'steps': 9773, 'loss/train': 1.0785945653915405} +11/06/2021 22:36:22 - INFO - __main__ - Step 9775: {'lr': 0.0004966038282147087, 'samples': 1876800, 'steps': 9774, 'loss/train': 1.5319066047668457} +11/06/2021 22:36:23 - INFO - __main__ - Step 9776: {'lr': 0.0004966029564170643, 'samples': 1876992, 'steps': 9775, 'loss/train': 1.8373252153396606} +11/06/2021 22:36:23 - INFO - __main__ - Step 9777: {'lr': 0.0004966020845083044, 'samples': 1877184, 'steps': 9776, 'loss/train': 1.9333018064498901} +11/06/2021 22:36:24 - INFO - __main__ - Step 9778: {'lr': 0.0004966012124884292, 'samples': 1877376, 'steps': 9777, 'loss/train': 1.7784291505813599} +11/06/2021 22:36:24 - INFO - __main__ - Step 9779: {'lr': 0.0004966003403574395, 'samples': 1877568, 'steps': 9778, 'loss/train': 2.0057530403137207} +11/06/2021 22:36:25 - INFO - __main__ - Step 9780: {'lr': 0.0004965994681153355, 'samples': 1877760, 'steps': 9779, 'loss/train': 1.3653117418289185} +11/06/2021 22:36:25 - INFO - __main__ - Step 9781: {'lr': 0.0004965985957621175, 'samples': 1877952, 'steps': 9780, 'loss/train': 1.5184459686279297} +11/06/2021 22:36:26 - INFO - __main__ - Step 9782: {'lr': 0.0004965977232977861, 'samples': 1878144, 'steps': 9781, 'loss/train': 1.0429720878601074} +11/06/2021 22:36:26 - INFO - __main__ - Step 9783: {'lr': 0.0004965968507223414, 'samples': 1878336, 'steps': 9782, 'loss/train': 1.5216965675354004} +11/06/2021 22:36:27 - INFO - __main__ - Step 9784: {'lr': 0.000496595978035784, 'samples': 1878528, 'steps': 9783, 'loss/train': 1.9085612297058105} +11/06/2021 22:36:27 - INFO - __main__ - Step 9785: {'lr': 0.0004965951052381144, 'samples': 1878720, 'steps': 9784, 'loss/train': 1.6528103351593018} +11/06/2021 22:36:28 - INFO - __main__ - Step 9786: {'lr': 0.0004965942323293328, 'samples': 1878912, 'steps': 9785, 'loss/train': 1.703324317932129} +11/06/2021 22:36:28 - INFO - __main__ - Step 9787: {'lr': 0.0004965933593094395, 'samples': 1879104, 'steps': 9786, 'loss/train': 1.8389208316802979} +11/06/2021 22:36:28 - INFO - __main__ - Step 9788: {'lr': 0.0004965924861784352, 'samples': 1879296, 'steps': 9787, 'loss/train': 2.069736957550049} +11/06/2021 22:36:29 - INFO - __main__ - Step 9789: {'lr': 0.0004965916129363201, 'samples': 1879488, 'steps': 9788, 'loss/train': 1.9471229314804077} +11/06/2021 22:36:30 - INFO - __main__ - Step 9790: {'lr': 0.0004965907395830945, 'samples': 1879680, 'steps': 9789, 'loss/train': 1.7488764524459839} +11/06/2021 22:36:30 - INFO - __main__ - Step 9791: {'lr': 0.000496589866118759, 'samples': 1879872, 'steps': 9790, 'loss/train': 2.344801902770996} +11/06/2021 22:36:30 - INFO - __main__ - Step 9792: {'lr': 0.000496588992543314, 'samples': 1880064, 'steps': 9791, 'loss/train': 1.8304022550582886} +11/06/2021 22:36:31 - INFO - __main__ - Step 9793: {'lr': 0.0004965881188567597, 'samples': 1880256, 'steps': 9792, 'loss/train': 1.6867663860321045} +11/06/2021 22:36:32 - INFO - __main__ - Step 9794: {'lr': 0.0004965872450590965, 'samples': 1880448, 'steps': 9793, 'loss/train': 1.4658312797546387} +11/06/2021 22:36:32 - INFO - __main__ - Step 9795: {'lr': 0.0004965863711503251, 'samples': 1880640, 'steps': 9794, 'loss/train': 2.786965847015381} +11/06/2021 22:36:33 - INFO - __main__ - Step 9796: {'lr': 0.0004965854971304457, 'samples': 1880832, 'steps': 9795, 'loss/train': 1.9178855419158936} +11/06/2021 22:36:33 - INFO - __main__ - Step 9797: {'lr': 0.0004965846229994586, 'samples': 1881024, 'steps': 9796, 'loss/train': 1.2724156379699707} +11/06/2021 22:36:34 - INFO - __main__ - Step 9798: {'lr': 0.0004965837487573641, 'samples': 1881216, 'steps': 9797, 'loss/train': 2.09515380859375} +11/06/2021 22:36:35 - INFO - __main__ - Step 9799: {'lr': 0.000496582874404163, 'samples': 1881408, 'steps': 9798, 'loss/train': 0.2936389148235321} +11/06/2021 22:36:35 - INFO - __main__ - Step 9800: {'lr': 0.0004965819999398554, 'samples': 1881600, 'steps': 9799, 'loss/train': 1.556630253791809} +11/06/2021 22:36:35 - INFO - __main__ - Step 9801: {'lr': 0.0004965811253644418, 'samples': 1881792, 'steps': 9800, 'loss/train': 1.5148653984069824} +11/06/2021 22:36:36 - INFO - __main__ - Step 9802: {'lr': 0.0004965802506779225, 'samples': 1881984, 'steps': 9801, 'loss/train': 1.8393759727478027} +11/06/2021 22:36:36 - INFO - __main__ - Step 9803: {'lr': 0.0004965793758802978, 'samples': 1882176, 'steps': 9802, 'loss/train': 1.732246994972229} +11/06/2021 22:36:37 - INFO - __main__ - Step 9804: {'lr': 0.0004965785009715684, 'samples': 1882368, 'steps': 9803, 'loss/train': 1.4041547775268555} +11/06/2021 22:36:37 - INFO - __main__ - Step 9805: {'lr': 0.0004965776259517345, 'samples': 1882560, 'steps': 9804, 'loss/train': 1.8803133964538574} +11/06/2021 22:36:38 - INFO - __main__ - Step 9806: {'lr': 0.0004965767508207966, 'samples': 1882752, 'steps': 9805, 'loss/train': 1.2590349912643433} +11/06/2021 22:36:38 - INFO - __main__ - Step 9807: {'lr': 0.000496575875578755, 'samples': 1882944, 'steps': 9806, 'loss/train': 2.212789535522461} +11/06/2021 22:36:38 - INFO - __main__ - Step 9808: {'lr': 0.00049657500022561, 'samples': 1883136, 'steps': 9807, 'loss/train': 1.9373009204864502} +11/06/2021 22:36:39 - INFO - __main__ - Step 9809: {'lr': 0.0004965741247613622, 'samples': 1883328, 'steps': 9808, 'loss/train': 0.9651688933372498} +11/06/2021 22:36:40 - INFO - __main__ - Step 9810: {'lr': 0.0004965732491860119, 'samples': 1883520, 'steps': 9809, 'loss/train': 2.099937915802002} +11/06/2021 22:36:40 - INFO - __main__ - Step 9811: {'lr': 0.0004965723734995594, 'samples': 1883712, 'steps': 9810, 'loss/train': 1.7372392416000366} +11/06/2021 22:36:40 - INFO - __main__ - Step 9812: {'lr': 0.0004965714977020053, 'samples': 1883904, 'steps': 9811, 'loss/train': 1.6284079551696777} +11/06/2021 22:36:41 - INFO - __main__ - Step 9813: {'lr': 0.0004965706217933499, 'samples': 1884096, 'steps': 9812, 'loss/train': 1.849391222000122} +11/06/2021 22:36:41 - INFO - __main__ - Step 9814: {'lr': 0.0004965697457735936, 'samples': 1884288, 'steps': 9813, 'loss/train': 1.648018717765808} +11/06/2021 22:36:42 - INFO - __main__ - Step 9815: {'lr': 0.0004965688696427366, 'samples': 1884480, 'steps': 9814, 'loss/train': 1.7322882413864136} +11/06/2021 22:36:42 - INFO - __main__ - Step 9816: {'lr': 0.0004965679934007797, 'samples': 1884672, 'steps': 9815, 'loss/train': 1.7675822973251343} +11/06/2021 22:36:43 - INFO - __main__ - Step 9817: {'lr': 0.0004965671170477229, 'samples': 1884864, 'steps': 9816, 'loss/train': 1.9023000001907349} +11/06/2021 22:36:43 - INFO - __main__ - Step 9818: {'lr': 0.0004965662405835668, 'samples': 1885056, 'steps': 9817, 'loss/train': 1.9403313398361206} +11/06/2021 22:36:43 - INFO - __main__ - Step 9819: {'lr': 0.0004965653640083118, 'samples': 1885248, 'steps': 9818, 'loss/train': 0.30051112174987793} +11/06/2021 22:36:45 - INFO - __main__ - Step 9820: {'lr': 0.0004965644873219583, 'samples': 1885440, 'steps': 9819, 'loss/train': 1.5804340839385986} +11/06/2021 22:36:45 - INFO - __main__ - Step 9821: {'lr': 0.0004965636105245066, 'samples': 1885632, 'steps': 9820, 'loss/train': 3.80881404876709} +11/06/2021 22:36:45 - INFO - __main__ - Step 9822: {'lr': 0.000496562733615957, 'samples': 1885824, 'steps': 9821, 'loss/train': 1.808201551437378} +11/06/2021 22:36:46 - INFO - __main__ - Step 9823: {'lr': 0.0004965618565963102, 'samples': 1886016, 'steps': 9822, 'loss/train': 1.3552080392837524} +11/06/2021 22:36:46 - INFO - __main__ - Step 9824: {'lr': 0.0004965609794655664, 'samples': 1886208, 'steps': 9823, 'loss/train': 1.8378883600234985} +11/06/2021 22:36:47 - INFO - __main__ - Step 9825: {'lr': 0.0004965601022237261, 'samples': 1886400, 'steps': 9824, 'loss/train': 1.9869000911712646} +11/06/2021 22:36:47 - INFO - __main__ - Step 9826: {'lr': 0.0004965592248707895, 'samples': 1886592, 'steps': 9825, 'loss/train': 1.6496671438217163} +11/06/2021 22:36:48 - INFO - __main__ - Step 9827: {'lr': 0.0004965583474067571, 'samples': 1886784, 'steps': 9826, 'loss/train': 1.5552690029144287} +11/06/2021 22:36:48 - INFO - __main__ - Step 9828: {'lr': 0.0004965574698316294, 'samples': 1886976, 'steps': 9827, 'loss/train': 1.9440776109695435} +11/06/2021 22:36:48 - INFO - __main__ - Step 9829: {'lr': 0.0004965565921454067, 'samples': 1887168, 'steps': 9828, 'loss/train': 1.336730718612671} +11/06/2021 22:36:49 - INFO - __main__ - Step 9830: {'lr': 0.0004965557143480893, 'samples': 1887360, 'steps': 9829, 'loss/train': 0.4165128171443939} +11/06/2021 22:36:50 - INFO - __main__ - Step 9831: {'lr': 0.0004965548364396779, 'samples': 1887552, 'steps': 9830, 'loss/train': 1.5435590744018555} +11/06/2021 22:36:50 - INFO - __main__ - Step 9832: {'lr': 0.0004965539584201725, 'samples': 1887744, 'steps': 9831, 'loss/train': 1.4158097505569458} +11/06/2021 22:36:50 - INFO - __main__ - Step 9833: {'lr': 0.0004965530802895738, 'samples': 1887936, 'steps': 9832, 'loss/train': 1.8684687614440918} +11/06/2021 22:36:51 - INFO - __main__ - Step 9834: {'lr': 0.000496552202047882, 'samples': 1888128, 'steps': 9833, 'loss/train': 2.1222503185272217} +11/06/2021 22:36:52 - INFO - __main__ - Step 9835: {'lr': 0.0004965513236950977, 'samples': 1888320, 'steps': 9834, 'loss/train': 1.6643342971801758} +11/06/2021 22:36:52 - INFO - __main__ - Step 9836: {'lr': 0.0004965504452312211, 'samples': 1888512, 'steps': 9835, 'loss/train': 1.892832636833191} +11/06/2021 22:36:53 - INFO - __main__ - Step 9837: {'lr': 0.0004965495666562527, 'samples': 1888704, 'steps': 9836, 'loss/train': 1.7342534065246582} +11/06/2021 22:36:53 - INFO - __main__ - Step 9838: {'lr': 0.0004965486879701928, 'samples': 1888896, 'steps': 9837, 'loss/train': 1.782392978668213} +11/06/2021 22:36:53 - INFO - __main__ - Step 9839: {'lr': 0.000496547809173042, 'samples': 1889088, 'steps': 9838, 'loss/train': 5.928685665130615} +11/06/2021 22:36:54 - INFO - __main__ - Step 9840: {'lr': 0.0004965469302648005, 'samples': 1889280, 'steps': 9839, 'loss/train': 2.1997225284576416} +11/06/2021 22:36:55 - INFO - __main__ - Step 9841: {'lr': 0.0004965460512454688, 'samples': 1889472, 'steps': 9840, 'loss/train': 1.9922882318496704} +11/06/2021 22:36:55 - INFO - __main__ - Step 9842: {'lr': 0.0004965451721150471, 'samples': 1889664, 'steps': 9841, 'loss/train': 1.385520100593567} +11/06/2021 22:36:55 - INFO - __main__ - Step 9843: {'lr': 0.0004965442928735361, 'samples': 1889856, 'steps': 9842, 'loss/train': 1.5797951221466064} +11/06/2021 22:36:56 - INFO - __main__ - Step 9844: {'lr': 0.000496543413520936, 'samples': 1890048, 'steps': 9843, 'loss/train': 1.9805771112442017} +11/06/2021 22:36:56 - INFO - __main__ - Step 9845: {'lr': 0.0004965425340572472, 'samples': 1890240, 'steps': 9844, 'loss/train': 2.120030403137207} +11/06/2021 22:36:57 - INFO - __main__ - Step 9846: {'lr': 0.0004965416544824703, 'samples': 1890432, 'steps': 9845, 'loss/train': 1.6327179670333862} +11/06/2021 22:36:58 - INFO - __main__ - Step 9847: {'lr': 0.0004965407747966053, 'samples': 1890624, 'steps': 9846, 'loss/train': 1.7754491567611694} +11/06/2021 22:36:58 - INFO - __main__ - Step 9848: {'lr': 0.000496539894999653, 'samples': 1890816, 'steps': 9847, 'loss/train': 1.8676059246063232} +11/06/2021 22:36:59 - INFO - __main__ - Step 9849: {'lr': 0.0004965390150916136, 'samples': 1891008, 'steps': 9848, 'loss/train': 1.9253339767456055} +11/06/2021 22:36:59 - INFO - __main__ - Step 9850: {'lr': 0.0004965381350724874, 'samples': 1891200, 'steps': 9849, 'loss/train': 1.7396340370178223} +11/06/2021 22:36:59 - INFO - __main__ - Step 9851: {'lr': 0.000496537254942275, 'samples': 1891392, 'steps': 9850, 'loss/train': 1.8926670551300049} +11/06/2021 22:37:00 - INFO - __main__ - Step 9852: {'lr': 0.0004965363747009767, 'samples': 1891584, 'steps': 9851, 'loss/train': 1.3262872695922852} +11/06/2021 22:37:01 - INFO - __main__ - Step 9853: {'lr': 0.000496535494348593, 'samples': 1891776, 'steps': 9852, 'loss/train': 1.9677116870880127} +11/06/2021 22:37:01 - INFO - __main__ - Step 9854: {'lr': 0.0004965346138851241, 'samples': 1891968, 'steps': 9853, 'loss/train': 1.1874512434005737} +11/06/2021 22:37:01 - INFO - __main__ - Step 9855: {'lr': 0.0004965337333105706, 'samples': 1892160, 'steps': 9854, 'loss/train': 2.6719613075256348} +11/06/2021 22:37:02 - INFO - __main__ - Step 9856: {'lr': 0.0004965328526249328, 'samples': 1892352, 'steps': 9855, 'loss/train': 1.6148555278778076} +11/06/2021 22:37:03 - INFO - __main__ - Step 9857: {'lr': 0.000496531971828211, 'samples': 1892544, 'steps': 9856, 'loss/train': 1.9275423288345337} +11/06/2021 22:37:03 - INFO - __main__ - Step 9858: {'lr': 0.0004965310909204058, 'samples': 1892736, 'steps': 9857, 'loss/train': 2.38356876373291} +11/06/2021 22:37:03 - INFO - __main__ - Step 9859: {'lr': 0.0004965302099015175, 'samples': 1892928, 'steps': 9858, 'loss/train': 1.5586031675338745} +11/06/2021 22:37:04 - INFO - __main__ - Step 9860: {'lr': 0.0004965293287715464, 'samples': 1893120, 'steps': 9859, 'loss/train': 1.8850369453430176} +11/06/2021 22:37:04 - INFO - __main__ - Step 9861: {'lr': 0.0004965284475304931, 'samples': 1893312, 'steps': 9860, 'loss/train': 2.069514274597168} +11/06/2021 22:37:06 - INFO - __main__ - Step 9862: {'lr': 0.0004965275661783579, 'samples': 1893504, 'steps': 9861, 'loss/train': 2.3399882316589355} +11/06/2021 22:37:06 - INFO - __main__ - Step 9863: {'lr': 0.0004965266847151411, 'samples': 1893696, 'steps': 9862, 'loss/train': 1.8240324258804321} +11/06/2021 22:37:07 - INFO - __main__ - Step 9864: {'lr': 0.0004965258031408432, 'samples': 1893888, 'steps': 9863, 'loss/train': 1.4843631982803345} +11/06/2021 22:37:07 - INFO - __main__ - Step 9865: {'lr': 0.0004965249214554645, 'samples': 1894080, 'steps': 9864, 'loss/train': 1.9368473291397095} +11/06/2021 22:37:07 - INFO - __main__ - Step 9866: {'lr': 0.0004965240396590055, 'samples': 1894272, 'steps': 9865, 'loss/train': 1.9536662101745605} +11/06/2021 22:37:08 - INFO - __main__ - Step 9867: {'lr': 0.0004965231577514666, 'samples': 1894464, 'steps': 9866, 'loss/train': 2.018059253692627} +11/06/2021 22:37:08 - INFO - __main__ - Step 9868: {'lr': 0.0004965222757328482, 'samples': 1894656, 'steps': 9867, 'loss/train': 2.956916093826294} +11/06/2021 22:37:09 - INFO - __main__ - Step 9869: {'lr': 0.0004965213936031507, 'samples': 1894848, 'steps': 9868, 'loss/train': 2.127044677734375} +11/06/2021 22:37:09 - INFO - __main__ - Step 9870: {'lr': 0.0004965205113623744, 'samples': 1895040, 'steps': 9869, 'loss/train': 1.807254433631897} +11/06/2021 22:37:10 - INFO - __main__ - Step 9871: {'lr': 0.0004965196290105197, 'samples': 1895232, 'steps': 9870, 'loss/train': 1.9776854515075684} +11/06/2021 22:37:10 - INFO - __main__ - Step 9872: {'lr': 0.0004965187465475873, 'samples': 1895424, 'steps': 9871, 'loss/train': 1.997361660003662} +11/06/2021 22:37:11 - INFO - __main__ - Step 9873: {'lr': 0.0004965178639735772, 'samples': 1895616, 'steps': 9872, 'loss/train': 1.981247067451477} +11/06/2021 22:37:11 - INFO - __main__ - Step 9874: {'lr': 0.0004965169812884898, 'samples': 1895808, 'steps': 9873, 'loss/train': 1.2999768257141113} +11/06/2021 22:37:12 - INFO - __main__ - Step 9875: {'lr': 0.0004965160984923259, 'samples': 1896000, 'steps': 9874, 'loss/train': 2.367384433746338} +11/06/2021 22:37:12 - INFO - __main__ - Step 9876: {'lr': 0.0004965152155850855, 'samples': 1896192, 'steps': 9875, 'loss/train': 1.639930248260498} +11/06/2021 22:37:13 - INFO - __main__ - Step 9877: {'lr': 0.0004965143325667692, 'samples': 1896384, 'steps': 9876, 'loss/train': 2.1641268730163574} +11/06/2021 22:37:13 - INFO - __main__ - Step 9878: {'lr': 0.0004965134494373773, 'samples': 1896576, 'steps': 9877, 'loss/train': 1.5240188837051392} +11/06/2021 22:37:13 - INFO - __main__ - Step 9879: {'lr': 0.0004965125661969103, 'samples': 1896768, 'steps': 9878, 'loss/train': 1.7663499116897583} +11/06/2021 22:37:14 - INFO - __main__ - Step 9880: {'lr': 0.0004965116828453685, 'samples': 1896960, 'steps': 9879, 'loss/train': 1.9683094024658203} +11/06/2021 22:37:15 - INFO - __main__ - Step 9881: {'lr': 0.0004965107993827524, 'samples': 1897152, 'steps': 9880, 'loss/train': 1.8044612407684326} +11/06/2021 22:37:15 - INFO - __main__ - Step 9882: {'lr': 0.0004965099158090624, 'samples': 1897344, 'steps': 9881, 'loss/train': 1.7531816959381104} +11/06/2021 22:37:15 - INFO - __main__ - Step 9883: {'lr': 0.0004965090321242987, 'samples': 1897536, 'steps': 9882, 'loss/train': 1.9520115852355957} +11/06/2021 22:37:16 - INFO - __main__ - Step 9884: {'lr': 0.0004965081483284618, 'samples': 1897728, 'steps': 9883, 'loss/train': 2.066235065460205} +11/06/2021 22:37:17 - INFO - __main__ - Step 9885: {'lr': 0.0004965072644215522, 'samples': 1897920, 'steps': 9884, 'loss/train': 1.9941020011901855} +11/06/2021 22:37:17 - INFO - __main__ - Step 9886: {'lr': 0.0004965063804035703, 'samples': 1898112, 'steps': 9885, 'loss/train': 1.8429374694824219} +11/06/2021 22:37:17 - INFO - __main__ - Step 9887: {'lr': 0.0004965054962745163, 'samples': 1898304, 'steps': 9886, 'loss/train': 2.1564157009124756} +11/06/2021 22:37:18 - INFO - __main__ - Step 9888: {'lr': 0.0004965046120343908, 'samples': 1898496, 'steps': 9887, 'loss/train': 1.4476630687713623} +11/06/2021 22:37:18 - INFO - __main__ - Step 9889: {'lr': 0.0004965037276831942, 'samples': 1898688, 'steps': 9888, 'loss/train': 1.0114924907684326} +11/06/2021 22:37:19 - INFO - __main__ - Step 9890: {'lr': 0.0004965028432209267, 'samples': 1898880, 'steps': 9889, 'loss/train': 1.0621055364608765} +11/06/2021 22:37:19 - INFO - __main__ - Step 9891: {'lr': 0.0004965019586475888, 'samples': 1899072, 'steps': 9890, 'loss/train': 1.3111342191696167} +11/06/2021 22:37:20 - INFO - __main__ - Step 9892: {'lr': 0.000496501073963181, 'samples': 1899264, 'steps': 9891, 'loss/train': 1.5163756608963013} +11/06/2021 22:37:20 - INFO - __main__ - Step 9893: {'lr': 0.0004965001891677037, 'samples': 1899456, 'steps': 9892, 'loss/train': 1.4711591005325317} +11/06/2021 22:37:21 - INFO - __main__ - Step 9894: {'lr': 0.000496499304261157, 'samples': 1899648, 'steps': 9893, 'loss/train': 2.3137621879577637} +11/06/2021 22:37:22 - INFO - __main__ - Step 9895: {'lr': 0.0004964984192435417, 'samples': 1899840, 'steps': 9894, 'loss/train': 1.8023244142532349} +11/06/2021 22:37:22 - INFO - __main__ - Step 9896: {'lr': 0.000496497534114858, 'samples': 1900032, 'steps': 9895, 'loss/train': 1.5675020217895508} +11/06/2021 22:37:23 - INFO - __main__ - Step 9897: {'lr': 0.0004964966488751062, 'samples': 1900224, 'steps': 9896, 'loss/train': 1.4843635559082031} +11/06/2021 22:37:23 - INFO - __main__ - Step 9898: {'lr': 0.000496495763524287, 'samples': 1900416, 'steps': 9897, 'loss/train': 2.4118194580078125} +11/06/2021 22:37:24 - INFO - __main__ - Step 9899: {'lr': 0.0004964948780624005, 'samples': 1900608, 'steps': 9898, 'loss/train': 1.6140505075454712} +11/06/2021 22:37:24 - INFO - __main__ - Step 9900: {'lr': 0.0004964939924894472, 'samples': 1900800, 'steps': 9899, 'loss/train': 1.5659464597702026} +11/06/2021 22:37:24 - INFO - __main__ - Step 9901: {'lr': 0.0004964931068054274, 'samples': 1900992, 'steps': 9900, 'loss/train': 0.7185819149017334} +11/06/2021 22:37:25 - INFO - __main__ - Step 9902: {'lr': 0.0004964922210103418, 'samples': 1901184, 'steps': 9901, 'loss/train': 0.6721516251564026} +11/06/2021 22:37:26 - INFO - __main__ - Step 9903: {'lr': 0.0004964913351041905, 'samples': 1901376, 'steps': 9902, 'loss/train': 2.110550880432129} +11/06/2021 22:37:26 - INFO - __main__ - Step 9904: {'lr': 0.000496490449086974, 'samples': 1901568, 'steps': 9903, 'loss/train': 2.038620948791504} +11/06/2021 22:37:26 - INFO - __main__ - Step 9905: {'lr': 0.0004964895629586928, 'samples': 1901760, 'steps': 9904, 'loss/train': 2.2174274921417236} +11/06/2021 22:37:27 - INFO - __main__ - Step 9906: {'lr': 0.0004964886767193471, 'samples': 1901952, 'steps': 9905, 'loss/train': 1.2710689306259155} +11/06/2021 22:37:27 - INFO - __main__ - Step 9907: {'lr': 0.0004964877903689375, 'samples': 1902144, 'steps': 9906, 'loss/train': 1.9977413415908813} +11/06/2021 22:37:28 - INFO - __main__ - Step 9908: {'lr': 0.0004964869039074643, 'samples': 1902336, 'steps': 9907, 'loss/train': 1.3191601037979126} +11/06/2021 22:37:29 - INFO - __main__ - Step 9909: {'lr': 0.000496486017334928, 'samples': 1902528, 'steps': 9908, 'loss/train': 2.083883047103882} +11/06/2021 22:37:29 - INFO - __main__ - Step 9910: {'lr': 0.0004964851306513287, 'samples': 1902720, 'steps': 9909, 'loss/train': 0.8083091974258423} +11/06/2021 22:37:29 - INFO - __main__ - Step 9911: {'lr': 0.0004964842438566671, 'samples': 1902912, 'steps': 9910, 'loss/train': 1.8291444778442383} +11/06/2021 22:37:30 - INFO - __main__ - Step 9912: {'lr': 0.0004964833569509434, 'samples': 1903104, 'steps': 9911, 'loss/train': 1.752215027809143} +11/06/2021 22:37:31 - INFO - __main__ - Step 9913: {'lr': 0.0004964824699341582, 'samples': 1903296, 'steps': 9912, 'loss/train': 1.807940125465393} +11/06/2021 22:37:31 - INFO - __main__ - Step 9914: {'lr': 0.0004964815828063118, 'samples': 1903488, 'steps': 9913, 'loss/train': 1.4366697072982788} +11/06/2021 22:37:31 - INFO - __main__ - Step 9915: {'lr': 0.0004964806955674046, 'samples': 1903680, 'steps': 9914, 'loss/train': 2.080610752105713} +11/06/2021 22:37:32 - INFO - __main__ - Step 9916: {'lr': 0.0004964798082174371, 'samples': 1903872, 'steps': 9915, 'loss/train': 1.5181411504745483} +11/06/2021 22:37:32 - INFO - __main__ - Step 9917: {'lr': 0.0004964789207564094, 'samples': 1904064, 'steps': 9916, 'loss/train': 1.8686342239379883} +11/06/2021 22:37:33 - INFO - __main__ - Step 9918: {'lr': 0.0004964780331843223, 'samples': 1904256, 'steps': 9917, 'loss/train': 2.0889878273010254} +11/06/2021 22:37:33 - INFO - __main__ - Step 9919: {'lr': 0.0004964771455011758, 'samples': 1904448, 'steps': 9918, 'loss/train': 1.7543959617614746} +11/06/2021 22:37:34 - INFO - __main__ - Step 9920: {'lr': 0.0004964762577069707, 'samples': 1904640, 'steps': 9919, 'loss/train': 1.4055709838867188} +11/06/2021 22:37:34 - INFO - __main__ - Step 9921: {'lr': 0.0004964753698017071, 'samples': 1904832, 'steps': 9920, 'loss/train': 1.6933525800704956} +11/06/2021 22:37:34 - INFO - __main__ - Step 9922: {'lr': 0.0004964744817853855, 'samples': 1905024, 'steps': 9921, 'loss/train': 1.261832356452942} +11/06/2021 22:37:35 - INFO - __main__ - Step 9923: {'lr': 0.0004964735936580063, 'samples': 1905216, 'steps': 9922, 'loss/train': 2.1547069549560547} +11/06/2021 22:37:36 - INFO - __main__ - Step 9924: {'lr': 0.00049647270541957, 'samples': 1905408, 'steps': 9923, 'loss/train': 1.4039684534072876} +11/06/2021 22:37:36 - INFO - __main__ - Step 9925: {'lr': 0.0004964718170700767, 'samples': 1905600, 'steps': 9924, 'loss/train': 1.7743269205093384} +11/06/2021 22:37:37 - INFO - __main__ - Step 9926: {'lr': 0.0004964709286095271, 'samples': 1905792, 'steps': 9925, 'loss/train': 1.6846635341644287} +11/06/2021 22:37:37 - INFO - __main__ - Step 9927: {'lr': 0.0004964700400379215, 'samples': 1905984, 'steps': 9926, 'loss/train': 1.7219330072402954} +11/06/2021 22:37:37 - INFO - __main__ - Step 9928: {'lr': 0.0004964691513552604, 'samples': 1906176, 'steps': 9927, 'loss/train': 1.6441329717636108} +11/06/2021 22:37:38 - INFO - __main__ - Step 9929: {'lr': 0.000496468262561544, 'samples': 1906368, 'steps': 9928, 'loss/train': 1.6577142477035522} +11/06/2021 22:37:38 - INFO - __main__ - Step 9930: {'lr': 0.0004964673736567728, 'samples': 1906560, 'steps': 9929, 'loss/train': 1.7367271184921265} +11/06/2021 22:37:39 - INFO - __main__ - Step 9931: {'lr': 0.0004964664846409473, 'samples': 1906752, 'steps': 9930, 'loss/train': 1.7608524560928345} +11/06/2021 22:37:39 - INFO - __main__ - Step 9932: {'lr': 0.0004964655955140677, 'samples': 1906944, 'steps': 9931, 'loss/train': 1.8868800401687622} +11/06/2021 22:37:40 - INFO - __main__ - Step 9933: {'lr': 0.0004964647062761345, 'samples': 1907136, 'steps': 9932, 'loss/train': 2.024883270263672} +11/06/2021 22:37:41 - INFO - __main__ - Step 9934: {'lr': 0.0004964638169271482, 'samples': 1907328, 'steps': 9933, 'loss/train': 1.661513328552246} +11/06/2021 22:37:41 - INFO - __main__ - Step 9935: {'lr': 0.0004964629274671091, 'samples': 1907520, 'steps': 9934, 'loss/train': 1.6273504495620728} +11/06/2021 22:37:42 - INFO - __main__ - Step 9936: {'lr': 0.0004964620378960175, 'samples': 1907712, 'steps': 9935, 'loss/train': 1.556241750717163} +11/06/2021 22:37:42 - INFO - __main__ - Step 9937: {'lr': 0.000496461148213874, 'samples': 1907904, 'steps': 9936, 'loss/train': 2.6705877780914307} +11/06/2021 22:37:42 - INFO - __main__ - Step 9938: {'lr': 0.0004964602584206788, 'samples': 1908096, 'steps': 9937, 'loss/train': 1.8545628786087036} +11/06/2021 22:37:43 - INFO - __main__ - Step 9939: {'lr': 0.0004964593685164326, 'samples': 1908288, 'steps': 9938, 'loss/train': 1.645344614982605} +11/06/2021 22:37:44 - INFO - __main__ - Step 9940: {'lr': 0.0004964584785011355, 'samples': 1908480, 'steps': 9939, 'loss/train': 1.6063035726547241} +11/06/2021 22:37:44 - INFO - __main__ - Step 9941: {'lr': 0.000496457588374788, 'samples': 1908672, 'steps': 9940, 'loss/train': 0.9683166146278381} +11/06/2021 22:37:44 - INFO - __main__ - Step 9942: {'lr': 0.0004964566981373905, 'samples': 1908864, 'steps': 9941, 'loss/train': 1.5615383386611938} +11/06/2021 22:37:45 - INFO - __main__ - Step 9943: {'lr': 0.0004964558077889435, 'samples': 1909056, 'steps': 9942, 'loss/train': 1.4332380294799805} +11/06/2021 22:37:45 - INFO - __main__ - Step 9944: {'lr': 0.0004964549173294472, 'samples': 1909248, 'steps': 9943, 'loss/train': 1.4659695625305176} +11/06/2021 22:37:46 - INFO - __main__ - Step 9945: {'lr': 0.0004964540267589023, 'samples': 1909440, 'steps': 9944, 'loss/train': 1.1614114046096802} +11/06/2021 22:37:46 - INFO - __main__ - Step 9946: {'lr': 0.0004964531360773088, 'samples': 1909632, 'steps': 9945, 'loss/train': 1.5709928274154663} +11/06/2021 22:37:47 - INFO - __main__ - Step 9947: {'lr': 0.0004964522452846675, 'samples': 1909824, 'steps': 9946, 'loss/train': 1.8149683475494385} +11/06/2021 22:37:47 - INFO - __main__ - Step 9948: {'lr': 0.0004964513543809785, 'samples': 1910016, 'steps': 9947, 'loss/train': 1.0438923835754395} +11/06/2021 22:37:48 - INFO - __main__ - Step 9949: {'lr': 0.0004964504633662424, 'samples': 1910208, 'steps': 9948, 'loss/train': 0.8558833599090576} +11/06/2021 22:37:49 - INFO - __main__ - Step 9950: {'lr': 0.0004964495722404595, 'samples': 1910400, 'steps': 9949, 'loss/train': 1.9778287410736084} +11/06/2021 22:37:49 - INFO - __main__ - Step 9951: {'lr': 0.0004964486810036301, 'samples': 1910592, 'steps': 9950, 'loss/train': 2.1700186729431152} +11/06/2021 22:37:49 - INFO - __main__ - Step 9952: {'lr': 0.000496447789655755, 'samples': 1910784, 'steps': 9951, 'loss/train': 1.5003530979156494} +11/06/2021 22:37:50 - INFO - __main__ - Step 9953: {'lr': 0.0004964468981968341, 'samples': 1910976, 'steps': 9952, 'loss/train': 1.8400135040283203} +11/06/2021 22:37:50 - INFO - __main__ - Step 9954: {'lr': 0.0004964460066268681, 'samples': 1911168, 'steps': 9953, 'loss/train': 1.9778108596801758} +11/06/2021 22:37:51 - INFO - __main__ - Step 9955: {'lr': 0.0004964451149458573, 'samples': 1911360, 'steps': 9954, 'loss/train': 1.6574676036834717} +11/06/2021 22:37:51 - INFO - __main__ - Step 9956: {'lr': 0.0004964442231538023, 'samples': 1911552, 'steps': 9955, 'loss/train': 1.1613150835037231} +11/06/2021 22:37:52 - INFO - __main__ - Step 9957: {'lr': 0.000496443331250703, 'samples': 1911744, 'steps': 9956, 'loss/train': 1.88170325756073} +11/06/2021 22:37:52 - INFO - __main__ - Step 9958: {'lr': 0.0004964424392365604, 'samples': 1911936, 'steps': 9957, 'loss/train': 2.3807883262634277} +11/06/2021 22:37:52 - INFO - __main__ - Step 9959: {'lr': 0.0004964415471113747, 'samples': 1912128, 'steps': 9958, 'loss/train': 2.4166524410247803} +11/06/2021 22:37:53 - INFO - __main__ - Step 9960: {'lr': 0.0004964406548751461, 'samples': 1912320, 'steps': 9959, 'loss/train': 2.397183656692505} +11/06/2021 22:37:54 - INFO - __main__ - Step 9961: {'lr': 0.0004964397625278751, 'samples': 1912512, 'steps': 9960, 'loss/train': 1.7461156845092773} +11/06/2021 22:37:54 - INFO - __main__ - Step 9962: {'lr': 0.0004964388700695623, 'samples': 1912704, 'steps': 9961, 'loss/train': 1.654305100440979} +11/06/2021 22:37:55 - INFO - __main__ - Step 9963: {'lr': 0.0004964379775002078, 'samples': 1912896, 'steps': 9962, 'loss/train': 2.360861301422119} +11/06/2021 22:37:55 - INFO - __main__ - Step 9964: {'lr': 0.0004964370848198122, 'samples': 1913088, 'steps': 9963, 'loss/train': 2.1414263248443604} +11/06/2021 22:37:55 - INFO - __main__ - Step 9965: {'lr': 0.0004964361920283759, 'samples': 1913280, 'steps': 9964, 'loss/train': 1.4624086618423462} +11/06/2021 22:37:56 - INFO - __main__ - Step 9966: {'lr': 0.0004964352991258992, 'samples': 1913472, 'steps': 9965, 'loss/train': 1.942596435546875} +11/06/2021 22:37:57 - INFO - __main__ - Step 9967: {'lr': 0.0004964344061123826, 'samples': 1913664, 'steps': 9966, 'loss/train': 1.6361198425292969} +11/06/2021 22:37:57 - INFO - __main__ - Step 9968: {'lr': 0.0004964335129878264, 'samples': 1913856, 'steps': 9967, 'loss/train': 1.1940803527832031} +11/06/2021 22:37:57 - INFO - __main__ - Step 9969: {'lr': 0.0004964326197522311, 'samples': 1914048, 'steps': 9968, 'loss/train': 1.8905918598175049} +11/06/2021 22:37:58 - INFO - __main__ - Step 9970: {'lr': 0.0004964317264055971, 'samples': 1914240, 'steps': 9969, 'loss/train': 1.6931695938110352} +11/06/2021 22:37:59 - INFO - __main__ - Step 9971: {'lr': 0.0004964308329479247, 'samples': 1914432, 'steps': 9970, 'loss/train': 2.065845489501953} +11/06/2021 22:37:59 - INFO - __main__ - Step 9972: {'lr': 0.0004964299393792143, 'samples': 1914624, 'steps': 9971, 'loss/train': 2.043527603149414} +11/06/2021 22:37:59 - INFO - __main__ - Step 9973: {'lr': 0.0004964290456994666, 'samples': 1914816, 'steps': 9972, 'loss/train': 1.4954372644424438} +11/06/2021 22:38:00 - INFO - __main__ - Step 9974: {'lr': 0.0004964281519086816, 'samples': 1915008, 'steps': 9973, 'loss/train': 2.400644302368164} +11/06/2021 22:38:00 - INFO - __main__ - Step 9975: {'lr': 0.0004964272580068599, 'samples': 1915200, 'steps': 9974, 'loss/train': 1.6218897104263306} +11/06/2021 22:38:01 - INFO - __main__ - Step 9976: {'lr': 0.0004964263639940018, 'samples': 1915392, 'steps': 9975, 'loss/train': 2.0930655002593994} +11/06/2021 22:38:02 - INFO - __main__ - Step 9977: {'lr': 0.000496425469870108, 'samples': 1915584, 'steps': 9976, 'loss/train': 1.391600251197815} +11/06/2021 22:38:02 - INFO - __main__ - Step 9978: {'lr': 0.0004964245756351786, 'samples': 1915776, 'steps': 9977, 'loss/train': 1.8200713396072388} +11/06/2021 22:38:02 - INFO - __main__ - Step 9979: {'lr': 0.000496423681289214, 'samples': 1915968, 'steps': 9978, 'loss/train': 1.7776697874069214} +11/06/2021 22:38:03 - INFO - __main__ - Step 9980: {'lr': 0.0004964227868322148, 'samples': 1916160, 'steps': 9979, 'loss/train': 1.082550287246704} +11/06/2021 22:38:04 - INFO - __main__ - Step 9981: {'lr': 0.0004964218922641812, 'samples': 1916352, 'steps': 9980, 'loss/train': 1.5953223705291748} +11/06/2021 22:38:04 - INFO - __main__ - Step 9982: {'lr': 0.0004964209975851137, 'samples': 1916544, 'steps': 9981, 'loss/train': 1.3076783418655396} +11/06/2021 22:38:04 - INFO - __main__ - Step 9983: {'lr': 0.0004964201027950129, 'samples': 1916736, 'steps': 9982, 'loss/train': 1.7255864143371582} +11/06/2021 22:38:05 - INFO - __main__ - Step 9984: {'lr': 0.0004964192078938788, 'samples': 1916928, 'steps': 9983, 'loss/train': 2.1289093494415283} +11/06/2021 22:38:05 - INFO - __main__ - Step 9985: {'lr': 0.0004964183128817121, 'samples': 1917120, 'steps': 9984, 'loss/train': 1.9382929801940918} +11/06/2021 22:38:06 - INFO - __main__ - Step 9986: {'lr': 0.000496417417758513, 'samples': 1917312, 'steps': 9985, 'loss/train': 1.6477100849151611} +11/06/2021 22:38:06 - INFO - __main__ - Step 9987: {'lr': 0.000496416522524282, 'samples': 1917504, 'steps': 9986, 'loss/train': 1.6857631206512451} +11/06/2021 22:38:07 - INFO - __main__ - Step 9988: {'lr': 0.0004964156271790197, 'samples': 1917696, 'steps': 9987, 'loss/train': 1.4530490636825562} +11/06/2021 22:38:07 - INFO - __main__ - Step 9989: {'lr': 0.0004964147317227262, 'samples': 1917888, 'steps': 9988, 'loss/train': 1.7035175561904907} +11/06/2021 22:38:07 - INFO - __main__ - Step 9990: {'lr': 0.000496413836155402, 'samples': 1918080, 'steps': 9989, 'loss/train': 1.9417301416397095} +11/06/2021 22:38:09 - INFO - __main__ - Step 9991: {'lr': 0.0004964129404770476, 'samples': 1918272, 'steps': 9990, 'loss/train': 1.67684006690979} +11/06/2021 22:38:09 - INFO - __main__ - Step 9992: {'lr': 0.0004964120446876633, 'samples': 1918464, 'steps': 9991, 'loss/train': 1.8245000839233398} +11/06/2021 22:38:09 - INFO - __main__ - Step 9993: {'lr': 0.0004964111487872495, 'samples': 1918656, 'steps': 9992, 'loss/train': 1.7816718816757202} +11/06/2021 22:38:10 - INFO - __main__ - Step 9994: {'lr': 0.0004964102527758067, 'samples': 1918848, 'steps': 9993, 'loss/train': 1.7993488311767578} +11/06/2021 22:38:10 - INFO - __main__ - Step 9995: {'lr': 0.0004964093566533352, 'samples': 1919040, 'steps': 9994, 'loss/train': 1.1521903276443481} +11/06/2021 22:38:11 - INFO - __main__ - Step 9996: {'lr': 0.0004964084604198354, 'samples': 1919232, 'steps': 9995, 'loss/train': 1.9137816429138184} +11/06/2021 22:38:11 - INFO - __main__ - Step 9997: {'lr': 0.0004964075640753079, 'samples': 1919424, 'steps': 9996, 'loss/train': 1.5610769987106323} +11/06/2021 22:38:12 - INFO - __main__ - Step 9998: {'lr': 0.0004964066676197528, 'samples': 1919616, 'steps': 9997, 'loss/train': 1.6594487428665161} +11/06/2021 22:38:12 - INFO - __main__ - Step 9999: {'lr': 0.0004964057710531707, 'samples': 1919808, 'steps': 9998, 'loss/train': 1.531420111656189} +11/06/2021 22:38:12 - INFO - __main__ - Step 10000: {'lr': 0.0004964048743755621, 'samples': 1920000, 'steps': 9999, 'loss/train': 1.2586203813552856} +11/06/2021 22:38:13 - INFO - __main__ - Step 10001: {'lr': 0.0004964039775869272, 'samples': 1920192, 'steps': 10000, 'loss/train': 1.3523963689804077} +11/06/2021 22:38:14 - INFO - __main__ - Step 10002: {'lr': 0.0004964030806872664, 'samples': 1920384, 'steps': 10001, 'loss/train': 1.9878268241882324} +11/06/2021 22:38:14 - INFO - __main__ - Step 10003: {'lr': 0.0004964021836765802, 'samples': 1920576, 'steps': 10002, 'loss/train': 1.8906978368759155} +11/06/2021 22:38:14 - INFO - __main__ - Step 10004: {'lr': 0.000496401286554869, 'samples': 1920768, 'steps': 10003, 'loss/train': 1.310309648513794} +11/06/2021 22:38:15 - INFO - __main__ - Step 10005: {'lr': 0.000496400389322133, 'samples': 1920960, 'steps': 10004, 'loss/train': 1.6377642154693604} +11/06/2021 22:38:15 - INFO - __main__ - Step 10006: {'lr': 0.000496399491978373, 'samples': 1921152, 'steps': 10005, 'loss/train': 2.1881837844848633} +11/06/2021 22:38:16 - INFO - __main__ - Step 10007: {'lr': 0.0004963985945235891, 'samples': 1921344, 'steps': 10006, 'loss/train': 1.2533279657363892} +11/06/2021 22:38:16 - INFO - __main__ - Step 10008: {'lr': 0.0004963976969577819, 'samples': 1921536, 'steps': 10007, 'loss/train': 1.3222609758377075} +11/06/2021 22:38:17 - INFO - __main__ - Step 10009: {'lr': 0.0004963967992809516, 'samples': 1921728, 'steps': 10008, 'loss/train': 1.7431193590164185} +11/06/2021 22:38:17 - INFO - __main__ - Step 10010: {'lr': 0.0004963959014930988, 'samples': 1921920, 'steps': 10009, 'loss/train': 2.0606842041015625} +11/06/2021 22:38:17 - INFO - __main__ - Step 10011: {'lr': 0.0004963950035942237, 'samples': 1922112, 'steps': 10010, 'loss/train': 1.9937307834625244} +11/06/2021 22:38:19 - INFO - __main__ - Step 10012: {'lr': 0.0004963941055843268, 'samples': 1922304, 'steps': 10011, 'loss/train': 1.7773168087005615} +11/06/2021 22:38:19 - INFO - __main__ - Step 10013: {'lr': 0.0004963932074634087, 'samples': 1922496, 'steps': 10012, 'loss/train': 1.3404390811920166} +11/06/2021 22:38:19 - INFO - __main__ - Step 10014: {'lr': 0.0004963923092314694, 'samples': 1922688, 'steps': 10013, 'loss/train': 1.3710219860076904} +11/06/2021 22:38:20 - INFO - __main__ - Step 10015: {'lr': 0.0004963914108885097, 'samples': 1922880, 'steps': 10014, 'loss/train': 1.7717443704605103} +11/06/2021 22:38:20 - INFO - __main__ - Step 10016: {'lr': 0.0004963905124345297, 'samples': 1923072, 'steps': 10015, 'loss/train': 1.6650587320327759} +11/06/2021 22:38:21 - INFO - __main__ - Step 10017: {'lr': 0.00049638961386953, 'samples': 1923264, 'steps': 10016, 'loss/train': 1.4850966930389404} +11/06/2021 22:38:21 - INFO - __main__ - Step 10018: {'lr': 0.000496388715193511, 'samples': 1923456, 'steps': 10017, 'loss/train': 1.0550109148025513} +11/06/2021 22:38:22 - INFO - __main__ - Step 10019: {'lr': 0.000496387816406473, 'samples': 1923648, 'steps': 10018, 'loss/train': 1.6358630657196045} +11/06/2021 22:38:22 - INFO - __main__ - Step 10020: {'lr': 0.0004963869175084164, 'samples': 1923840, 'steps': 10019, 'loss/train': 1.7765165567398071} +11/06/2021 22:38:22 - INFO - __main__ - Step 10021: {'lr': 0.0004963860184993416, 'samples': 1924032, 'steps': 10020, 'loss/train': 1.717958688735962} +11/06/2021 22:38:23 - INFO - __main__ - Step 10022: {'lr': 0.0004963851193792492, 'samples': 1924224, 'steps': 10021, 'loss/train': 1.7283834218978882} +11/06/2021 22:38:24 - INFO - __main__ - Step 10023: {'lr': 0.0004963842201481394, 'samples': 1924416, 'steps': 10022, 'loss/train': 1.514644742012024} +11/06/2021 22:38:24 - INFO - __main__ - Step 10024: {'lr': 0.0004963833208060128, 'samples': 1924608, 'steps': 10023, 'loss/train': 1.3506485223770142} +11/06/2021 22:38:24 - INFO - __main__ - Step 10025: {'lr': 0.0004963824213528696, 'samples': 1924800, 'steps': 10024, 'loss/train': 1.9384859800338745} +11/06/2021 22:38:25 - INFO - __main__ - Step 10026: {'lr': 0.0004963815217887102, 'samples': 1924992, 'steps': 10025, 'loss/train': 2.230543851852417} +11/06/2021 22:38:26 - INFO - __main__ - Step 10027: {'lr': 0.0004963806221135351, 'samples': 1925184, 'steps': 10026, 'loss/train': 1.5828680992126465} +11/06/2021 22:38:26 - INFO - __main__ - Step 10028: {'lr': 0.0004963797223273448, 'samples': 1925376, 'steps': 10027, 'loss/train': 2.0957136154174805} +11/06/2021 22:38:27 - INFO - __main__ - Step 10029: {'lr': 0.0004963788224301395, 'samples': 1925568, 'steps': 10028, 'loss/train': 2.020629405975342} +11/06/2021 22:38:27 - INFO - __main__ - Step 10030: {'lr': 0.0004963779224219197, 'samples': 1925760, 'steps': 10029, 'loss/train': 1.7997504472732544} +11/06/2021 22:38:27 - INFO - __main__ - Step 10031: {'lr': 0.0004963770223026858, 'samples': 1925952, 'steps': 10030, 'loss/train': 1.9878836870193481} +11/06/2021 22:38:28 - INFO - __main__ - Step 10032: {'lr': 0.0004963761220724384, 'samples': 1926144, 'steps': 10031, 'loss/train': 1.9155443906784058} +11/06/2021 22:38:29 - INFO - __main__ - Step 10033: {'lr': 0.0004963752217311775, 'samples': 1926336, 'steps': 10032, 'loss/train': 1.7525060176849365} +11/06/2021 22:38:29 - INFO - __main__ - Step 10034: {'lr': 0.0004963743212789038, 'samples': 1926528, 'steps': 10033, 'loss/train': 2.0401864051818848} +11/06/2021 22:38:29 - INFO - __main__ - Step 10035: {'lr': 0.0004963734207156178, 'samples': 1926720, 'steps': 10034, 'loss/train': 1.524163007736206} +11/06/2021 22:38:30 - INFO - __main__ - Step 10036: {'lr': 0.0004963725200413195, 'samples': 1926912, 'steps': 10035, 'loss/train': 1.768740177154541} +11/06/2021 22:38:30 - INFO - __main__ - Step 10037: {'lr': 0.0004963716192560097, 'samples': 1927104, 'steps': 10036, 'loss/train': 0.7059550285339355} +11/06/2021 22:38:31 - INFO - __main__ - Step 10038: {'lr': 0.0004963707183596885, 'samples': 1927296, 'steps': 10037, 'loss/train': 1.979498267173767} +11/06/2021 22:38:32 - INFO - __main__ - Step 10039: {'lr': 0.0004963698173523566, 'samples': 1927488, 'steps': 10038, 'loss/train': 1.3461339473724365} +11/06/2021 22:38:32 - INFO - __main__ - Step 10040: {'lr': 0.0004963689162340142, 'samples': 1927680, 'steps': 10039, 'loss/train': 1.8551632165908813} +11/06/2021 22:38:32 - INFO - __main__ - Step 10041: {'lr': 0.0004963680150046618, 'samples': 1927872, 'steps': 10040, 'loss/train': 1.8479679822921753} +11/06/2021 22:38:33 - INFO - __main__ - Step 10042: {'lr': 0.0004963671136642997, 'samples': 1928064, 'steps': 10041, 'loss/train': 1.8179422616958618} +11/06/2021 22:38:34 - INFO - __main__ - Step 10043: {'lr': 0.0004963662122129284, 'samples': 1928256, 'steps': 10042, 'loss/train': 1.5947130918502808} +11/06/2021 22:38:34 - INFO - __main__ - Step 10044: {'lr': 0.0004963653106505483, 'samples': 1928448, 'steps': 10043, 'loss/train': 2.2334413528442383} +11/06/2021 22:38:34 - INFO - __main__ - Step 10045: {'lr': 0.0004963644089771598, 'samples': 1928640, 'steps': 10044, 'loss/train': 1.9353092908859253} +11/06/2021 22:38:35 - INFO - __main__ - Step 10046: {'lr': 0.0004963635071927633, 'samples': 1928832, 'steps': 10045, 'loss/train': 1.261295199394226} +11/06/2021 22:38:35 - INFO - __main__ - Step 10047: {'lr': 0.0004963626052973592, 'samples': 1929024, 'steps': 10046, 'loss/train': 1.8938654661178589} +11/06/2021 22:38:36 - INFO - __main__ - Step 10048: {'lr': 0.0004963617032909479, 'samples': 1929216, 'steps': 10047, 'loss/train': 1.5131046772003174} +11/06/2021 22:38:36 - INFO - __main__ - Step 10049: {'lr': 0.0004963608011735298, 'samples': 1929408, 'steps': 10048, 'loss/train': 1.5676438808441162} +11/06/2021 22:38:37 - INFO - __main__ - Step 10050: {'lr': 0.0004963598989451053, 'samples': 1929600, 'steps': 10049, 'loss/train': 1.8830301761627197} +11/06/2021 22:38:37 - INFO - __main__ - Step 10051: {'lr': 0.000496358996605675, 'samples': 1929792, 'steps': 10050, 'loss/train': 1.9643739461898804} +11/06/2021 22:38:37 - INFO - __main__ - Step 10052: {'lr': 0.0004963580941552391, 'samples': 1929984, 'steps': 10051, 'loss/train': 1.7612366676330566} +11/06/2021 22:38:38 - INFO - __main__ - Step 10053: {'lr': 0.0004963571915937979, 'samples': 1930176, 'steps': 10052, 'loss/train': 1.8770025968551636} +11/06/2021 22:38:39 - INFO - __main__ - Step 10054: {'lr': 0.000496356288921352, 'samples': 1930368, 'steps': 10053, 'loss/train': 1.7088673114776611} +11/06/2021 22:38:39 - INFO - __main__ - Step 10055: {'lr': 0.0004963553861379018, 'samples': 1930560, 'steps': 10054, 'loss/train': 2.023212194442749} +11/06/2021 22:38:39 - INFO - __main__ - Step 10056: {'lr': 0.0004963544832434476, 'samples': 1930752, 'steps': 10055, 'loss/train': 1.9566535949707031} +11/06/2021 22:38:40 - INFO - __main__ - Step 10057: {'lr': 0.00049635358023799, 'samples': 1930944, 'steps': 10056, 'loss/train': 1.7718608379364014} +11/06/2021 22:38:41 - INFO - __main__ - Step 10058: {'lr': 0.0004963526771215291, 'samples': 1931136, 'steps': 10057, 'loss/train': 1.9035671949386597} +11/06/2021 22:38:41 - INFO - __main__ - Step 10059: {'lr': 0.0004963517738940656, 'samples': 1931328, 'steps': 10058, 'loss/train': 1.7526215314865112} +11/06/2021 22:38:41 - INFO - __main__ - Step 10060: {'lr': 0.0004963508705555998, 'samples': 1931520, 'steps': 10059, 'loss/train': 1.9995636940002441} +11/06/2021 22:38:42 - INFO - __main__ - Step 10061: {'lr': 0.000496349967106132, 'samples': 1931712, 'steps': 10060, 'loss/train': 1.6497392654418945} +11/06/2021 22:38:42 - INFO - __main__ - Step 10062: {'lr': 0.0004963490635456629, 'samples': 1931904, 'steps': 10061, 'loss/train': 1.680986762046814} +11/06/2021 22:38:42 - INFO - __main__ - Step 10063: {'lr': 0.0004963481598741925, 'samples': 1932096, 'steps': 10062, 'loss/train': 1.8724141120910645} +11/06/2021 22:38:43 - INFO - __main__ - Step 10064: {'lr': 0.0004963472560917216, 'samples': 1932288, 'steps': 10063, 'loss/train': 1.6809192895889282} +11/06/2021 22:38:44 - INFO - __main__ - Step 10065: {'lr': 0.0004963463521982503, 'samples': 1932480, 'steps': 10064, 'loss/train': 1.8800909519195557} +11/06/2021 22:38:44 - INFO - __main__ - Step 10066: {'lr': 0.0004963454481937791, 'samples': 1932672, 'steps': 10065, 'loss/train': 1.9918426275253296} +11/06/2021 22:38:45 - INFO - __main__ - Step 10067: {'lr': 0.0004963445440783086, 'samples': 1932864, 'steps': 10066, 'loss/train': 1.8763664960861206} +11/06/2021 22:38:45 - INFO - __main__ - Step 10068: {'lr': 0.0004963436398518389, 'samples': 1933056, 'steps': 10067, 'loss/train': 1.3873255252838135} +11/06/2021 22:38:46 - INFO - __main__ - Step 10069: {'lr': 0.0004963427355143706, 'samples': 1933248, 'steps': 10068, 'loss/train': 1.4686658382415771} +11/06/2021 22:38:46 - INFO - __main__ - Step 10070: {'lr': 0.0004963418310659041, 'samples': 1933440, 'steps': 10069, 'loss/train': 1.890317440032959} +11/06/2021 22:38:47 - INFO - __main__ - Step 10071: {'lr': 0.0004963409265064398, 'samples': 1933632, 'steps': 10070, 'loss/train': 1.8712046146392822} +11/06/2021 22:38:47 - INFO - __main__ - Step 10072: {'lr': 0.0004963400218359781, 'samples': 1933824, 'steps': 10071, 'loss/train': 1.9994356632232666} +11/06/2021 22:38:47 - INFO - __main__ - Step 10073: {'lr': 0.0004963391170545193, 'samples': 1934016, 'steps': 10072, 'loss/train': 1.4278088808059692} +11/06/2021 22:38:48 - INFO - __main__ - Step 10074: {'lr': 0.0004963382121620639, 'samples': 1934208, 'steps': 10073, 'loss/train': 1.821343183517456} +11/06/2021 22:38:49 - INFO - __main__ - Step 10075: {'lr': 0.0004963373071586123, 'samples': 1934400, 'steps': 10074, 'loss/train': 2.091646909713745} +11/06/2021 22:38:49 - INFO - __main__ - Step 10076: {'lr': 0.000496336402044165, 'samples': 1934592, 'steps': 10075, 'loss/train': 1.838132619857788} +11/06/2021 22:38:49 - INFO - __main__ - Step 10077: {'lr': 0.0004963354968187222, 'samples': 1934784, 'steps': 10076, 'loss/train': 1.6847151517868042} +11/06/2021 22:38:50 - INFO - __main__ - Step 10078: {'lr': 0.0004963345914822845, 'samples': 1934976, 'steps': 10077, 'loss/train': 1.5948516130447388} +11/06/2021 22:38:51 - INFO - __main__ - Step 10079: {'lr': 0.0004963336860348521, 'samples': 1935168, 'steps': 10078, 'loss/train': 1.8252551555633545} +11/06/2021 22:38:51 - INFO - __main__ - Step 10080: {'lr': 0.0004963327804764257, 'samples': 1935360, 'steps': 10079, 'loss/train': 1.9088850021362305} +11/06/2021 22:38:52 - INFO - __main__ - Step 10081: {'lr': 0.0004963318748070056, 'samples': 1935552, 'steps': 10080, 'loss/train': 1.7089757919311523} +11/06/2021 22:38:52 - INFO - __main__ - Step 10082: {'lr': 0.0004963309690265921, 'samples': 1935744, 'steps': 10081, 'loss/train': 1.9372551441192627} +11/06/2021 22:38:52 - INFO - __main__ - Step 10083: {'lr': 0.0004963300631351856, 'samples': 1935936, 'steps': 10082, 'loss/train': 1.6880172491073608} +11/06/2021 22:38:53 - INFO - __main__ - Step 10084: {'lr': 0.0004963291571327866, 'samples': 1936128, 'steps': 10083, 'loss/train': 1.8040343523025513} +11/06/2021 22:38:54 - INFO - __main__ - Step 10085: {'lr': 0.0004963282510193955, 'samples': 1936320, 'steps': 10084, 'loss/train': 1.7773646116256714} +11/06/2021 22:38:54 - INFO - __main__ - Step 10086: {'lr': 0.0004963273447950126, 'samples': 1936512, 'steps': 10085, 'loss/train': 1.7499951124191284} +11/06/2021 22:38:54 - INFO - __main__ - Step 10087: {'lr': 0.0004963264384596386, 'samples': 1936704, 'steps': 10086, 'loss/train': 1.3979496955871582} +11/06/2021 22:38:55 - INFO - __main__ - Step 10088: {'lr': 0.0004963255320132735, 'samples': 1936896, 'steps': 10087, 'loss/train': 2.1118416786193848} +11/06/2021 22:38:55 - INFO - __main__ - Step 10089: {'lr': 0.0004963246254559181, 'samples': 1937088, 'steps': 10088, 'loss/train': 1.7357311248779297} +11/06/2021 22:38:56 - INFO - __main__ - Step 10090: {'lr': 0.0004963237187875724, 'samples': 1937280, 'steps': 10089, 'loss/train': 1.6976773738861084} +11/06/2021 22:38:56 - INFO - __main__ - Step 10091: {'lr': 0.0004963228120082372, 'samples': 1937472, 'steps': 10090, 'loss/train': 2.041823148727417} +11/06/2021 22:38:57 - INFO - __main__ - Step 10092: {'lr': 0.0004963219051179127, 'samples': 1937664, 'steps': 10091, 'loss/train': 1.77364182472229} +11/06/2021 22:38:57 - INFO - __main__ - Step 10093: {'lr': 0.0004963209981165993, 'samples': 1937856, 'steps': 10092, 'loss/train': 2.122255802154541} +11/06/2021 22:38:57 - INFO - __main__ - Step 10094: {'lr': 0.0004963200910042976, 'samples': 1938048, 'steps': 10093, 'loss/train': 1.8102829456329346} +11/06/2021 22:38:59 - INFO - __main__ - Step 10095: {'lr': 0.0004963191837810077, 'samples': 1938240, 'steps': 10094, 'loss/train': 1.7681382894515991} +11/06/2021 22:38:59 - INFO - __main__ - Step 10096: {'lr': 0.0004963182764467303, 'samples': 1938432, 'steps': 10095, 'loss/train': 1.8665366172790527} +11/06/2021 22:38:59 - INFO - __main__ - Step 10097: {'lr': 0.0004963173690014656, 'samples': 1938624, 'steps': 10096, 'loss/train': 2.1923022270202637} +11/06/2021 22:39:00 - INFO - __main__ - Step 10098: {'lr': 0.0004963164614452142, 'samples': 1938816, 'steps': 10097, 'loss/train': 1.7837992906570435} +11/06/2021 22:39:00 - INFO - __main__ - Step 10099: {'lr': 0.0004963155537779764, 'samples': 1939008, 'steps': 10098, 'loss/train': 1.7613967657089233} +11/06/2021 22:39:01 - INFO - __main__ - Step 10100: {'lr': 0.0004963146459997525, 'samples': 1939200, 'steps': 10099, 'loss/train': 0.7903871536254883} +11/06/2021 22:39:01 - INFO - __main__ - Step 10101: {'lr': 0.0004963137381105431, 'samples': 1939392, 'steps': 10100, 'loss/train': 2.0459229946136475} +11/06/2021 22:39:02 - INFO - __main__ - Step 10102: {'lr': 0.0004963128301103485, 'samples': 1939584, 'steps': 10101, 'loss/train': 1.6579885482788086} +11/06/2021 22:39:02 - INFO - __main__ - Step 10103: {'lr': 0.0004963119219991691, 'samples': 1939776, 'steps': 10102, 'loss/train': 1.9690332412719727} +11/06/2021 22:39:02 - INFO - __main__ - Step 10104: {'lr': 0.0004963110137770054, 'samples': 1939968, 'steps': 10103, 'loss/train': 1.717148780822754} +11/06/2021 22:39:04 - INFO - __main__ - Step 10105: {'lr': 0.0004963101054438578, 'samples': 1940160, 'steps': 10104, 'loss/train': 2.5613667964935303} +11/06/2021 22:39:04 - INFO - __main__ - Step 10106: {'lr': 0.0004963091969997265, 'samples': 1940352, 'steps': 10105, 'loss/train': 1.79701566696167} +11/06/2021 22:39:05 - INFO - __main__ - Step 10107: {'lr': 0.0004963082884446123, 'samples': 1940544, 'steps': 10106, 'loss/train': 1.8763283491134644} +11/06/2021 22:39:05 - INFO - __main__ - Step 10108: {'lr': 0.0004963073797785153, 'samples': 1940736, 'steps': 10107, 'loss/train': 1.9007415771484375} +11/06/2021 22:39:06 - INFO - __main__ - Step 10109: {'lr': 0.000496306471001436, 'samples': 1940928, 'steps': 10108, 'loss/train': 0.9993707537651062} +11/06/2021 22:39:06 - INFO - __main__ - Step 10110: {'lr': 0.0004963055621133748, 'samples': 1941120, 'steps': 10109, 'loss/train': 1.6748651266098022} +11/06/2021 22:39:06 - INFO - __main__ - Step 10111: {'lr': 0.0004963046531143321, 'samples': 1941312, 'steps': 10110, 'loss/train': 1.998529076576233} +11/06/2021 22:39:07 - INFO - __main__ - Step 10112: {'lr': 0.0004963037440043083, 'samples': 1941504, 'steps': 10111, 'loss/train': 1.8323516845703125} +11/06/2021 22:39:08 - INFO - __main__ - Step 10113: {'lr': 0.0004963028347833038, 'samples': 1941696, 'steps': 10112, 'loss/train': 2.443237066268921} +11/06/2021 22:39:08 - INFO - __main__ - Step 10114: {'lr': 0.0004963019254513191, 'samples': 1941888, 'steps': 10113, 'loss/train': 1.495759129524231} +11/06/2021 22:39:08 - INFO - __main__ - Step 10115: {'lr': 0.0004963010160083546, 'samples': 1942080, 'steps': 10114, 'loss/train': 1.9651312828063965} +11/06/2021 22:39:09 - INFO - __main__ - Step 10116: {'lr': 0.0004963001064544106, 'samples': 1942272, 'steps': 10115, 'loss/train': 1.4049568176269531} +11/06/2021 22:39:10 - INFO - __main__ - Step 10117: {'lr': 0.0004962991967894876, 'samples': 1942464, 'steps': 10116, 'loss/train': 1.3363804817199707} +11/06/2021 22:39:10 - INFO - __main__ - Step 10118: {'lr': 0.0004962982870135859, 'samples': 1942656, 'steps': 10117, 'loss/train': 1.6501933336257935} +11/06/2021 22:39:11 - INFO - __main__ - Step 10119: {'lr': 0.0004962973771267061, 'samples': 1942848, 'steps': 10118, 'loss/train': 1.7426259517669678} +11/06/2021 22:39:11 - INFO - __main__ - Step 10120: {'lr': 0.0004962964671288484, 'samples': 1943040, 'steps': 10119, 'loss/train': 1.8889999389648438} +11/06/2021 22:39:11 - INFO - __main__ - Step 10121: {'lr': 0.0004962955570200135, 'samples': 1943232, 'steps': 10120, 'loss/train': 1.7648907899856567} +11/06/2021 22:39:12 - INFO - __main__ - Step 10122: {'lr': 0.0004962946468002014, 'samples': 1943424, 'steps': 10121, 'loss/train': 2.164283514022827} +11/06/2021 22:39:13 - INFO - __main__ - Step 10123: {'lr': 0.0004962937364694129, 'samples': 1943616, 'steps': 10122, 'loss/train': 2.0995631217956543} +11/06/2021 22:39:13 - INFO - __main__ - Step 10124: {'lr': 0.0004962928260276481, 'samples': 1943808, 'steps': 10123, 'loss/train': 0.9570446014404297} +11/06/2021 22:39:13 - INFO - __main__ - Step 10125: {'lr': 0.0004962919154749077, 'samples': 1944000, 'steps': 10124, 'loss/train': 1.9521758556365967} +11/06/2021 22:39:14 - INFO - __main__ - Step 10126: {'lr': 0.0004962910048111919, 'samples': 1944192, 'steps': 10125, 'loss/train': 1.8387959003448486} +11/06/2021 22:39:14 - INFO - __main__ - Step 10127: {'lr': 0.0004962900940365012, 'samples': 1944384, 'steps': 10126, 'loss/train': 1.178709864616394} +11/06/2021 22:39:15 - INFO - __main__ - Step 10128: {'lr': 0.0004962891831508359, 'samples': 1944576, 'steps': 10127, 'loss/train': 1.920640230178833} +11/06/2021 22:39:15 - INFO - __main__ - Step 10129: {'lr': 0.0004962882721541965, 'samples': 1944768, 'steps': 10128, 'loss/train': 1.703497290611267} +11/06/2021 22:39:16 - INFO - __main__ - Step 10130: {'lr': 0.0004962873610465835, 'samples': 1944960, 'steps': 10129, 'loss/train': 1.4937912225723267} +11/06/2021 22:39:16 - INFO - __main__ - Step 10131: {'lr': 0.0004962864498279972, 'samples': 1945152, 'steps': 10130, 'loss/train': 1.5674489736557007} +11/06/2021 22:39:17 - INFO - __main__ - Step 10132: {'lr': 0.000496285538498438, 'samples': 1945344, 'steps': 10131, 'loss/train': 1.649821162223816} +11/06/2021 22:39:18 - INFO - __main__ - Step 10133: {'lr': 0.0004962846270579062, 'samples': 1945536, 'steps': 10132, 'loss/train': 1.809035062789917} +11/06/2021 22:39:18 - INFO - __main__ - Step 10134: {'lr': 0.0004962837155064025, 'samples': 1945728, 'steps': 10133, 'loss/train': 1.8651890754699707} +11/06/2021 22:39:18 - INFO - __main__ - Step 10135: {'lr': 0.0004962828038439272, 'samples': 1945920, 'steps': 10134, 'loss/train': 1.8161650896072388} +11/06/2021 22:39:19 - INFO - __main__ - Step 10136: {'lr': 0.0004962818920704805, 'samples': 1946112, 'steps': 10135, 'loss/train': 2.1492648124694824} +11/06/2021 22:39:19 - INFO - __main__ - Step 10137: {'lr': 0.0004962809801860632, 'samples': 1946304, 'steps': 10136, 'loss/train': 1.2017062902450562} +11/06/2021 22:39:20 - INFO - __main__ - Step 10138: {'lr': 0.0004962800681906753, 'samples': 1946496, 'steps': 10137, 'loss/train': 1.8302303552627563} +11/06/2021 22:39:20 - INFO - __main__ - Step 10139: {'lr': 0.0004962791560843175, 'samples': 1946688, 'steps': 10138, 'loss/train': 1.9001319408416748} +11/06/2021 22:39:21 - INFO - __main__ - Step 10140: {'lr': 0.00049627824386699, 'samples': 1946880, 'steps': 10139, 'loss/train': 1.766602873802185} +11/06/2021 22:39:21 - INFO - __main__ - Step 10141: {'lr': 0.0004962773315386935, 'samples': 1947072, 'steps': 10140, 'loss/train': 2.360720157623291} +11/06/2021 22:39:21 - INFO - __main__ - Step 10142: {'lr': 0.0004962764190994282, 'samples': 1947264, 'steps': 10141, 'loss/train': 1.9311211109161377} +11/06/2021 22:39:22 - INFO - __main__ - Step 10143: {'lr': 0.0004962755065491944, 'samples': 1947456, 'steps': 10142, 'loss/train': 1.6629748344421387} +11/06/2021 22:39:23 - INFO - __main__ - Step 10144: {'lr': 0.0004962745938879928, 'samples': 1947648, 'steps': 10143, 'loss/train': 2.1842613220214844} +11/06/2021 22:39:23 - INFO - __main__ - Step 10145: {'lr': 0.0004962736811158236, 'samples': 1947840, 'steps': 10144, 'loss/train': 1.8755285739898682} +11/06/2021 22:39:23 - INFO - __main__ - Step 10146: {'lr': 0.0004962727682326873, 'samples': 1948032, 'steps': 10145, 'loss/train': 1.2577018737792969} +11/06/2021 22:39:24 - INFO - __main__ - Step 10147: {'lr': 0.0004962718552385843, 'samples': 1948224, 'steps': 10146, 'loss/train': 1.5316803455352783} +11/06/2021 22:39:25 - INFO - __main__ - Step 10148: {'lr': 0.000496270942133515, 'samples': 1948416, 'steps': 10147, 'loss/train': 2.5291173458099365} +11/06/2021 22:39:25 - INFO - __main__ - Step 10149: {'lr': 0.0004962700289174798, 'samples': 1948608, 'steps': 10148, 'loss/train': 1.7601622343063354} +11/06/2021 22:39:26 - INFO - __main__ - Step 10150: {'lr': 0.0004962691155904791, 'samples': 1948800, 'steps': 10149, 'loss/train': 1.9934760332107544} +11/06/2021 22:39:26 - INFO - __main__ - Step 10151: {'lr': 0.0004962682021525134, 'samples': 1948992, 'steps': 10150, 'loss/train': 1.820966124534607} +11/06/2021 22:39:26 - INFO - __main__ - Step 10152: {'lr': 0.000496267288603583, 'samples': 1949184, 'steps': 10151, 'loss/train': 1.7241519689559937} +11/06/2021 22:39:27 - INFO - __main__ - Step 10153: {'lr': 0.0004962663749436883, 'samples': 1949376, 'steps': 10152, 'loss/train': 1.250434160232544} +11/06/2021 22:39:28 - INFO - __main__ - Step 10154: {'lr': 0.0004962654611728299, 'samples': 1949568, 'steps': 10153, 'loss/train': 1.601660966873169} +11/06/2021 22:39:28 - INFO - __main__ - Step 10155: {'lr': 0.000496264547291008, 'samples': 1949760, 'steps': 10154, 'loss/train': 1.6472324132919312} +11/06/2021 22:39:28 - INFO - __main__ - Step 10156: {'lr': 0.0004962636332982232, 'samples': 1949952, 'steps': 10155, 'loss/train': 0.9378107786178589} +11/06/2021 22:39:29 - INFO - __main__ - Step 10157: {'lr': 0.0004962627191944756, 'samples': 1950144, 'steps': 10156, 'loss/train': 1.7389650344848633} +11/06/2021 22:39:29 - INFO - __main__ - Step 10158: {'lr': 0.000496261804979766, 'samples': 1950336, 'steps': 10157, 'loss/train': 1.7131973505020142} +11/06/2021 22:39:30 - INFO - __main__ - Step 10159: {'lr': 0.0004962608906540946, 'samples': 1950528, 'steps': 10158, 'loss/train': 1.5908807516098022} +11/06/2021 22:39:30 - INFO - __main__ - Step 10160: {'lr': 0.0004962599762174618, 'samples': 1950720, 'steps': 10159, 'loss/train': 1.8197942972183228} +11/06/2021 22:39:31 - INFO - __main__ - Step 10161: {'lr': 0.0004962590616698681, 'samples': 1950912, 'steps': 10160, 'loss/train': 1.3586111068725586} +11/06/2021 22:39:31 - INFO - __main__ - Step 10162: {'lr': 0.0004962581470113138, 'samples': 1951104, 'steps': 10161, 'loss/train': 1.4758445024490356} +11/06/2021 22:39:31 - INFO - __main__ - Step 10163: {'lr': 0.0004962572322417994, 'samples': 1951296, 'steps': 10162, 'loss/train': 2.033109426498413} +11/06/2021 22:39:33 - INFO - __main__ - Step 10164: {'lr': 0.0004962563173613254, 'samples': 1951488, 'steps': 10163, 'loss/train': 2.092374324798584} +11/06/2021 22:39:33 - INFO - __main__ - Step 10165: {'lr': 0.000496255402369892, 'samples': 1951680, 'steps': 10164, 'loss/train': 1.1480693817138672} +11/06/2021 22:39:33 - INFO - __main__ - Step 10166: {'lr': 0.0004962544872674997, 'samples': 1951872, 'steps': 10165, 'loss/train': 1.6419637203216553} +11/06/2021 22:39:34 - INFO - __main__ - Step 10167: {'lr': 0.000496253572054149, 'samples': 1952064, 'steps': 10166, 'loss/train': 2.001441240310669} +11/06/2021 22:39:34 - INFO - __main__ - Step 10168: {'lr': 0.0004962526567298402, 'samples': 1952256, 'steps': 10167, 'loss/train': 0.8515803217887878} +11/06/2021 22:39:35 - INFO - __main__ - Step 10169: {'lr': 0.0004962517412945738, 'samples': 1952448, 'steps': 10168, 'loss/train': 1.8724167346954346} +11/06/2021 22:39:35 - INFO - __main__ - Step 10170: {'lr': 0.00049625082574835, 'samples': 1952640, 'steps': 10169, 'loss/train': 1.8901619911193848} +11/06/2021 22:39:36 - INFO - __main__ - Step 10171: {'lr': 0.0004962499100911696, 'samples': 1952832, 'steps': 10170, 'loss/train': 1.726631999015808} +11/06/2021 22:39:36 - INFO - __main__ - Step 10172: {'lr': 0.0004962489943230326, 'samples': 1953024, 'steps': 10171, 'loss/train': 1.2755616903305054} +11/06/2021 22:39:36 - INFO - __main__ - Step 10173: {'lr': 0.0004962480784439397, 'samples': 1953216, 'steps': 10172, 'loss/train': 1.9039602279663086} +11/06/2021 22:39:38 - INFO - __main__ - Step 10174: {'lr': 0.0004962471624538913, 'samples': 1953408, 'steps': 10173, 'loss/train': 2.694628953933716} +11/06/2021 22:39:38 - INFO - __main__ - Step 10175: {'lr': 0.0004962462463528875, 'samples': 1953600, 'steps': 10174, 'loss/train': 1.5455642938613892} +11/06/2021 22:39:38 - INFO - __main__ - Step 10176: {'lr': 0.0004962453301409291, 'samples': 1953792, 'steps': 10175, 'loss/train': 2.612506866455078} +11/06/2021 22:39:39 - INFO - __main__ - Step 10177: {'lr': 0.0004962444138180164, 'samples': 1953984, 'steps': 10176, 'loss/train': 1.5094280242919922} +11/06/2021 22:39:39 - INFO - __main__ - Step 10178: {'lr': 0.0004962434973841497, 'samples': 1954176, 'steps': 10177, 'loss/train': 1.740395426750183} +11/06/2021 22:39:39 - INFO - __main__ - Step 10179: {'lr': 0.0004962425808393295, 'samples': 1954368, 'steps': 10178, 'loss/train': 1.4363911151885986} +11/06/2021 22:39:40 - INFO - __main__ - Step 10180: {'lr': 0.000496241664183556, 'samples': 1954560, 'steps': 10179, 'loss/train': 1.8234004974365234} +11/06/2021 22:39:41 - INFO - __main__ - Step 10181: {'lr': 0.0004962407474168301, 'samples': 1954752, 'steps': 10180, 'loss/train': 2.219465970993042} +11/06/2021 22:39:41 - INFO - __main__ - Step 10182: {'lr': 0.0004962398305391518, 'samples': 1954944, 'steps': 10181, 'loss/train': 1.733228087425232} +11/06/2021 22:39:41 - INFO - __main__ - Step 10183: {'lr': 0.0004962389135505217, 'samples': 1955136, 'steps': 10182, 'loss/train': 1.9149515628814697} +11/06/2021 22:39:42 - INFO - __main__ - Step 10184: {'lr': 0.00049623799645094, 'samples': 1955328, 'steps': 10183, 'loss/train': 1.2486367225646973} +11/06/2021 22:39:43 - INFO - __main__ - Step 10185: {'lr': 0.0004962370792404073, 'samples': 1955520, 'steps': 10184, 'loss/train': 1.7573951482772827} +11/06/2021 22:39:43 - INFO - __main__ - Step 10186: {'lr': 0.000496236161918924, 'samples': 1955712, 'steps': 10185, 'loss/train': 2.166736125946045} +11/06/2021 22:39:43 - INFO - __main__ - Step 10187: {'lr': 0.0004962352444864904, 'samples': 1955904, 'steps': 10186, 'loss/train': 1.8243874311447144} +11/06/2021 22:39:44 - INFO - __main__ - Step 10188: {'lr': 0.0004962343269431072, 'samples': 1956096, 'steps': 10187, 'loss/train': 1.3378742933273315} +11/06/2021 22:39:44 - INFO - __main__ - Step 10189: {'lr': 0.0004962334092887744, 'samples': 1956288, 'steps': 10188, 'loss/train': 1.5770504474639893} +11/06/2021 22:39:45 - INFO - __main__ - Step 10190: {'lr': 0.0004962324915234928, 'samples': 1956480, 'steps': 10189, 'loss/train': 1.703421711921692} +11/06/2021 22:39:46 - INFO - __main__ - Step 10191: {'lr': 0.0004962315736472626, 'samples': 1956672, 'steps': 10190, 'loss/train': 1.7759064435958862} +11/06/2021 22:39:46 - INFO - __main__ - Step 10192: {'lr': 0.0004962306556600842, 'samples': 1956864, 'steps': 10191, 'loss/train': 1.7851485013961792} +11/06/2021 22:39:46 - INFO - __main__ - Step 10193: {'lr': 0.0004962297375619581, 'samples': 1957056, 'steps': 10192, 'loss/train': 1.8357267379760742} +11/06/2021 22:39:47 - INFO - __main__ - Step 10194: {'lr': 0.0004962288193528846, 'samples': 1957248, 'steps': 10193, 'loss/train': 1.8837649822235107} +11/06/2021 22:39:48 - INFO - __main__ - Step 10195: {'lr': 0.0004962279010328642, 'samples': 1957440, 'steps': 10194, 'loss/train': 1.5941526889801025} +11/06/2021 22:39:48 - INFO - __main__ - Step 10196: {'lr': 0.0004962269826018974, 'samples': 1957632, 'steps': 10195, 'loss/train': 1.2281931638717651} +11/06/2021 22:39:48 - INFO - __main__ - Step 10197: {'lr': 0.0004962260640599845, 'samples': 1957824, 'steps': 10196, 'loss/train': 1.6017422676086426} +11/06/2021 22:39:49 - INFO - __main__ - Step 10198: {'lr': 0.0004962251454071259, 'samples': 1958016, 'steps': 10197, 'loss/train': 1.4461283683776855} +11/06/2021 22:39:49 - INFO - __main__ - Step 10199: {'lr': 0.0004962242266433221, 'samples': 1958208, 'steps': 10198, 'loss/train': 1.918282151222229} +11/06/2021 22:39:51 - INFO - __main__ - Step 10200: {'lr': 0.0004962233077685734, 'samples': 1958400, 'steps': 10199, 'loss/train': 1.5870373249053955} +11/06/2021 22:39:51 - INFO - __main__ - Step 10201: {'lr': 0.0004962223887828803, 'samples': 1958592, 'steps': 10200, 'loss/train': 1.9776827096939087} +11/06/2021 22:39:52 - INFO - __main__ - Step 10202: {'lr': 0.0004962214696862432, 'samples': 1958784, 'steps': 10201, 'loss/train': 1.859332799911499} +11/06/2021 22:39:52 - INFO - __main__ - Step 10203: {'lr': 0.0004962205504786626, 'samples': 1958976, 'steps': 10202, 'loss/train': 1.5587915182113647} +11/06/2021 22:39:52 - INFO - __main__ - Step 10204: {'lr': 0.0004962196311601386, 'samples': 1959168, 'steps': 10203, 'loss/train': 2.007300615310669} +11/06/2021 22:39:53 - INFO - __main__ - Step 10205: {'lr': 0.000496218711730672, 'samples': 1959360, 'steps': 10204, 'loss/train': 1.5240142345428467} +11/06/2021 22:39:53 - INFO - __main__ - Step 10206: {'lr': 0.000496217792190263, 'samples': 1959552, 'steps': 10205, 'loss/train': 1.8262863159179688} +11/06/2021 22:39:54 - INFO - __main__ - Step 10207: {'lr': 0.0004962168725389121, 'samples': 1959744, 'steps': 10206, 'loss/train': 1.8134788274765015} +11/06/2021 22:39:54 - INFO - __main__ - Step 10208: {'lr': 0.0004962159527766196, 'samples': 1959936, 'steps': 10207, 'loss/train': 1.8182828426361084} +11/06/2021 22:39:55 - INFO - __main__ - Step 10209: {'lr': 0.000496215032903386, 'samples': 1960128, 'steps': 10208, 'loss/train': 2.6121604442596436} +11/06/2021 22:39:55 - INFO - __main__ - Step 10210: {'lr': 0.0004962141129192118, 'samples': 1960320, 'steps': 10209, 'loss/train': 1.8937207460403442} +11/06/2021 22:39:56 - INFO - __main__ - Step 10211: {'lr': 0.0004962131928240972, 'samples': 1960512, 'steps': 10210, 'loss/train': 2.1297640800476074} +11/06/2021 22:39:56 - INFO - __main__ - Step 10212: {'lr': 0.0004962122726180428, 'samples': 1960704, 'steps': 10211, 'loss/train': 1.8525015115737915} +11/06/2021 22:39:57 - INFO - __main__ - Step 10213: {'lr': 0.000496211352301049, 'samples': 1960896, 'steps': 10212, 'loss/train': 2.0309906005859375} +11/06/2021 22:39:57 - INFO - __main__ - Step 10214: {'lr': 0.0004962104318731161, 'samples': 1961088, 'steps': 10213, 'loss/train': 1.6677395105361938} +11/06/2021 22:39:58 - INFO - __main__ - Step 10215: {'lr': 0.0004962095113342445, 'samples': 1961280, 'steps': 10214, 'loss/train': 1.9678434133529663} +11/06/2021 22:39:58 - INFO - __main__ - Step 10216: {'lr': 0.0004962085906844348, 'samples': 1961472, 'steps': 10215, 'loss/train': 1.773742437362671} +11/06/2021 22:39:58 - INFO - __main__ - Step 10217: {'lr': 0.0004962076699236873, 'samples': 1961664, 'steps': 10216, 'loss/train': 1.3391557931900024} +11/06/2021 22:39:59 - INFO - __main__ - Step 10218: {'lr': 0.0004962067490520024, 'samples': 1961856, 'steps': 10217, 'loss/train': 1.5753556489944458} +11/06/2021 22:40:00 - INFO - __main__ - Step 10219: {'lr': 0.0004962058280693805, 'samples': 1962048, 'steps': 10218, 'loss/train': 1.1909321546554565} +11/06/2021 22:40:00 - INFO - __main__ - Step 10220: {'lr': 0.0004962049069758221, 'samples': 1962240, 'steps': 10219, 'loss/train': 2.3441052436828613} +11/06/2021 22:40:00 - INFO - __main__ - Step 10221: {'lr': 0.0004962039857713276, 'samples': 1962432, 'steps': 10220, 'loss/train': 2.0248935222625732} +11/06/2021 22:40:01 - INFO - __main__ - Step 10222: {'lr': 0.0004962030644558974, 'samples': 1962624, 'steps': 10221, 'loss/train': 2.0207021236419678} +11/06/2021 22:40:02 - INFO - __main__ - Step 10223: {'lr': 0.0004962021430295319, 'samples': 1962816, 'steps': 10222, 'loss/train': 2.0765750408172607} +11/06/2021 22:40:02 - INFO - __main__ - Step 10224: {'lr': 0.0004962012214922314, 'samples': 1963008, 'steps': 10223, 'loss/train': 1.82279372215271} +11/06/2021 22:40:02 - INFO - __main__ - Step 10225: {'lr': 0.0004962002998439966, 'samples': 1963200, 'steps': 10224, 'loss/train': 2.235682725906372} +11/06/2021 22:40:03 - INFO - __main__ - Step 10226: {'lr': 0.0004961993780848276, 'samples': 1963392, 'steps': 10225, 'loss/train': 1.372536301612854} +11/06/2021 22:40:03 - INFO - __main__ - Step 10227: {'lr': 0.000496198456214725, 'samples': 1963584, 'steps': 10226, 'loss/train': 2.1596105098724365} +11/06/2021 22:40:04 - INFO - __main__ - Step 10228: {'lr': 0.0004961975342336891, 'samples': 1963776, 'steps': 10227, 'loss/train': 1.9234440326690674} +11/06/2021 22:40:05 - INFO - __main__ - Step 10229: {'lr': 0.0004961966121417204, 'samples': 1963968, 'steps': 10228, 'loss/train': 1.7350918054580688} +11/06/2021 22:40:05 - INFO - __main__ - Step 10230: {'lr': 0.0004961956899388195, 'samples': 1964160, 'steps': 10229, 'loss/train': 1.6040425300598145} +11/06/2021 22:40:05 - INFO - __main__ - Step 10231: {'lr': 0.0004961947676249864, 'samples': 1964352, 'steps': 10230, 'loss/train': 1.6913650035858154} +11/06/2021 22:40:06 - INFO - __main__ - Step 10232: {'lr': 0.0004961938452002218, 'samples': 1964544, 'steps': 10231, 'loss/train': 1.3374961614608765} +11/06/2021 22:40:06 - INFO - __main__ - Step 10233: {'lr': 0.0004961929226645261, 'samples': 1964736, 'steps': 10232, 'loss/train': 1.7283188104629517} +11/06/2021 22:40:07 - INFO - __main__ - Step 10234: {'lr': 0.0004961920000178996, 'samples': 1964928, 'steps': 10233, 'loss/train': 1.5170456171035767} +11/06/2021 22:40:07 - INFO - __main__ - Step 10235: {'lr': 0.0004961910772603429, 'samples': 1965120, 'steps': 10234, 'loss/train': 1.6485928297042847} +11/06/2021 22:40:08 - INFO - __main__ - Step 10236: {'lr': 0.0004961901543918563, 'samples': 1965312, 'steps': 10235, 'loss/train': 1.1824220418930054} +11/06/2021 22:40:08 - INFO - __main__ - Step 10237: {'lr': 0.0004961892314124401, 'samples': 1965504, 'steps': 10236, 'loss/train': 1.3500611782073975} +11/06/2021 22:40:08 - INFO - __main__ - Step 10238: {'lr': 0.0004961883083220948, 'samples': 1965696, 'steps': 10237, 'loss/train': 1.5080724954605103} +11/06/2021 22:40:09 - INFO - __main__ - Step 10239: {'lr': 0.0004961873851208209, 'samples': 1965888, 'steps': 10238, 'loss/train': 1.8465136289596558} +11/06/2021 22:40:10 - INFO - __main__ - Step 10240: {'lr': 0.0004961864618086188, 'samples': 1966080, 'steps': 10239, 'loss/train': 1.8443377017974854} +11/06/2021 22:40:10 - INFO - __main__ - Step 10241: {'lr': 0.0004961855383854889, 'samples': 1966272, 'steps': 10240, 'loss/train': 1.4369864463806152} +11/06/2021 22:40:10 - INFO - __main__ - Step 10242: {'lr': 0.0004961846148514315, 'samples': 1966464, 'steps': 10241, 'loss/train': 1.790596842765808} +11/06/2021 22:40:11 - INFO - __main__ - Step 10243: {'lr': 0.0004961836912064472, 'samples': 1966656, 'steps': 10242, 'loss/train': 1.661517858505249} +11/06/2021 22:40:12 - INFO - __main__ - Step 10244: {'lr': 0.0004961827674505363, 'samples': 1966848, 'steps': 10243, 'loss/train': 0.9283877015113831} +11/06/2021 22:40:12 - INFO - __main__ - Step 10245: {'lr': 0.0004961818435836993, 'samples': 1967040, 'steps': 10244, 'loss/train': 2.5082814693450928} +11/06/2021 22:40:13 - INFO - __main__ - Step 10246: {'lr': 0.0004961809196059365, 'samples': 1967232, 'steps': 10245, 'loss/train': 0.8113244771957397} +11/06/2021 22:40:13 - INFO - __main__ - Step 10247: {'lr': 0.0004961799955172483, 'samples': 1967424, 'steps': 10246, 'loss/train': 1.7437840700149536} +11/06/2021 22:40:13 - INFO - __main__ - Step 10248: {'lr': 0.0004961790713176353, 'samples': 1967616, 'steps': 10247, 'loss/train': 1.9482618570327759} +11/06/2021 22:40:14 - INFO - __main__ - Step 10249: {'lr': 0.0004961781470070978, 'samples': 1967808, 'steps': 10248, 'loss/train': 1.7293133735656738} +11/06/2021 22:40:15 - INFO - __main__ - Step 10250: {'lr': 0.0004961772225856362, 'samples': 1968000, 'steps': 10249, 'loss/train': 1.6525590419769287} +11/06/2021 22:40:15 - INFO - __main__ - Step 10251: {'lr': 0.0004961762980532509, 'samples': 1968192, 'steps': 10250, 'loss/train': 1.758000135421753} +11/06/2021 22:40:15 - INFO - __main__ - Step 10252: {'lr': 0.0004961753734099425, 'samples': 1968384, 'steps': 10251, 'loss/train': 1.3765827417373657} +11/06/2021 22:40:16 - INFO - __main__ - Step 10253: {'lr': 0.0004961744486557112, 'samples': 1968576, 'steps': 10252, 'loss/train': 1.9734203815460205} +11/06/2021 22:40:17 - INFO - __main__ - Step 10254: {'lr': 0.0004961735237905574, 'samples': 1968768, 'steps': 10253, 'loss/train': 1.5639272928237915} +11/06/2021 22:40:17 - INFO - __main__ - Step 10255: {'lr': 0.0004961725988144816, 'samples': 1968960, 'steps': 10254, 'loss/train': 1.7732101678848267} +11/06/2021 22:40:17 - INFO - __main__ - Step 10256: {'lr': 0.0004961716737274844, 'samples': 1969152, 'steps': 10255, 'loss/train': 1.2973039150238037} +11/06/2021 22:40:18 - INFO - __main__ - Step 10257: {'lr': 0.0004961707485295659, 'samples': 1969344, 'steps': 10256, 'loss/train': 1.6465765237808228} +11/06/2021 22:40:18 - INFO - __main__ - Step 10258: {'lr': 0.0004961698232207268, 'samples': 1969536, 'steps': 10257, 'loss/train': 1.0470538139343262} +11/06/2021 22:40:18 - INFO - __main__ - Step 10259: {'lr': 0.0004961688978009672, 'samples': 1969728, 'steps': 10258, 'loss/train': 1.853024959564209} +11/06/2021 22:40:19 - INFO - __main__ - Step 10260: {'lr': 0.0004961679722702879, 'samples': 1969920, 'steps': 10259, 'loss/train': 1.3597272634506226} +11/06/2021 22:40:20 - INFO - __main__ - Step 10261: {'lr': 0.0004961670466286889, 'samples': 1970112, 'steps': 10260, 'loss/train': 1.9587664604187012} +11/06/2021 22:40:20 - INFO - __main__ - Step 10262: {'lr': 0.000496166120876171, 'samples': 1970304, 'steps': 10261, 'loss/train': 1.988135814666748} +11/06/2021 22:40:21 - INFO - __main__ - Step 10263: {'lr': 0.0004961651950127343, 'samples': 1970496, 'steps': 10262, 'loss/train': 1.9414300918579102} +11/06/2021 22:40:21 - INFO - __main__ - Step 10264: {'lr': 0.0004961642690383794, 'samples': 1970688, 'steps': 10263, 'loss/train': 1.9191449880599976} +11/06/2021 22:40:22 - INFO - __main__ - Step 10265: {'lr': 0.0004961633429531068, 'samples': 1970880, 'steps': 10264, 'loss/train': 2.015342950820923} +11/06/2021 22:40:22 - INFO - __main__ - Step 10266: {'lr': 0.0004961624167569166, 'samples': 1971072, 'steps': 10265, 'loss/train': 1.3776711225509644} +11/06/2021 22:40:23 - INFO - __main__ - Step 10267: {'lr': 0.0004961614904498095, 'samples': 1971264, 'steps': 10266, 'loss/train': 2.4013566970825195} +11/06/2021 22:40:23 - INFO - __main__ - Step 10268: {'lr': 0.0004961605640317858, 'samples': 1971456, 'steps': 10267, 'loss/train': 1.6062275171279907} +11/06/2021 22:40:23 - INFO - __main__ - Step 10269: {'lr': 0.0004961596375028461, 'samples': 1971648, 'steps': 10268, 'loss/train': 1.3712677955627441} +11/06/2021 22:40:24 - INFO - __main__ - Step 10270: {'lr': 0.0004961587108629906, 'samples': 1971840, 'steps': 10269, 'loss/train': 1.1406784057617188} +11/06/2021 22:40:25 - INFO - __main__ - Step 10271: {'lr': 0.0004961577841122197, 'samples': 1972032, 'steps': 10270, 'loss/train': 1.5826045274734497} +11/06/2021 22:40:25 - INFO - __main__ - Step 10272: {'lr': 0.000496156857250534, 'samples': 1972224, 'steps': 10271, 'loss/train': 1.612403154373169} +11/06/2021 22:40:25 - INFO - __main__ - Step 10273: {'lr': 0.0004961559302779338, 'samples': 1972416, 'steps': 10272, 'loss/train': 1.9364298582077026} +11/06/2021 22:40:26 - INFO - __main__ - Step 10274: {'lr': 0.0004961550031944194, 'samples': 1972608, 'steps': 10273, 'loss/train': 1.6951217651367188} +11/06/2021 22:40:27 - INFO - __main__ - Step 10275: {'lr': 0.0004961540759999914, 'samples': 1972800, 'steps': 10274, 'loss/train': 2.1520490646362305} +11/06/2021 22:40:27 - INFO - __main__ - Step 10276: {'lr': 0.0004961531486946502, 'samples': 1972992, 'steps': 10275, 'loss/train': 1.9737766981124878} +11/06/2021 22:40:28 - INFO - __main__ - Step 10277: {'lr': 0.0004961522212783962, 'samples': 1973184, 'steps': 10276, 'loss/train': 1.5989540815353394} +11/06/2021 22:40:28 - INFO - __main__ - Step 10278: {'lr': 0.00049615129375123, 'samples': 1973376, 'steps': 10277, 'loss/train': 0.26742538809776306} +11/06/2021 22:40:29 - INFO - __main__ - Step 10279: {'lr': 0.0004961503661131515, 'samples': 1973568, 'steps': 10278, 'loss/train': 1.548420786857605} +11/06/2021 22:40:30 - INFO - __main__ - Step 10280: {'lr': 0.0004961494383641616, 'samples': 1973760, 'steps': 10279, 'loss/train': 1.5787936449050903} +11/06/2021 22:40:30 - INFO - __main__ - Step 10281: {'lr': 0.0004961485105042606, 'samples': 1973952, 'steps': 10280, 'loss/train': 2.117009401321411} +11/06/2021 22:40:30 - INFO - __main__ - Step 10282: {'lr': 0.0004961475825334488, 'samples': 1974144, 'steps': 10281, 'loss/train': 1.2511065006256104} +11/06/2021 22:40:31 - INFO - __main__ - Step 10283: {'lr': 0.0004961466544517267, 'samples': 1974336, 'steps': 10282, 'loss/train': 2.109795570373535} +11/06/2021 22:40:31 - INFO - __main__ - Step 10284: {'lr': 0.0004961457262590948, 'samples': 1974528, 'steps': 10283, 'loss/train': 1.5047543048858643} +11/06/2021 22:40:31 - INFO - __main__ - Step 10285: {'lr': 0.0004961447979555533, 'samples': 1974720, 'steps': 10284, 'loss/train': 1.6194933652877808} +11/06/2021 22:40:32 - INFO - __main__ - Step 10286: {'lr': 0.000496143869541103, 'samples': 1974912, 'steps': 10285, 'loss/train': 1.41692054271698} +11/06/2021 22:40:33 - INFO - __main__ - Step 10287: {'lr': 0.0004961429410157437, 'samples': 1975104, 'steps': 10286, 'loss/train': 1.688002586364746} +11/06/2021 22:40:33 - INFO - __main__ - Step 10288: {'lr': 0.0004961420123794764, 'samples': 1975296, 'steps': 10287, 'loss/train': 1.7760323286056519} +11/06/2021 22:40:34 - INFO - __main__ - Step 10289: {'lr': 0.0004961410836323014, 'samples': 1975488, 'steps': 10288, 'loss/train': 1.8118081092834473} +11/06/2021 22:40:34 - INFO - __main__ - Step 10290: {'lr': 0.0004961401547742189, 'samples': 1975680, 'steps': 10289, 'loss/train': 1.0009771585464478} +11/06/2021 22:40:35 - INFO - __main__ - Step 10291: {'lr': 0.0004961392258052294, 'samples': 1975872, 'steps': 10290, 'loss/train': 1.9054882526397705} +11/06/2021 22:40:35 - INFO - __main__ - Step 10292: {'lr': 0.0004961382967253335, 'samples': 1976064, 'steps': 10291, 'loss/train': 1.815101981163025} +11/06/2021 22:40:36 - INFO - __main__ - Step 10293: {'lr': 0.0004961373675345315, 'samples': 1976256, 'steps': 10292, 'loss/train': 1.6685025691986084} +11/06/2021 22:40:36 - INFO - __main__ - Step 10294: {'lr': 0.0004961364382328236, 'samples': 1976448, 'steps': 10293, 'loss/train': 1.8122519254684448} +11/06/2021 22:40:36 - INFO - __main__ - Step 10295: {'lr': 0.0004961355088202106, 'samples': 1976640, 'steps': 10294, 'loss/train': 1.760857105255127} +11/06/2021 22:40:37 - INFO - __main__ - Step 10296: {'lr': 0.0004961345792966926, 'samples': 1976832, 'steps': 10295, 'loss/train': 2.0797855854034424} +11/06/2021 22:40:38 - INFO - __main__ - Step 10297: {'lr': 0.0004961336496622702, 'samples': 1977024, 'steps': 10296, 'loss/train': 0.4716089367866516} +11/06/2021 22:40:38 - INFO - __main__ - Step 10298: {'lr': 0.0004961327199169438, 'samples': 1977216, 'steps': 10297, 'loss/train': 1.8852925300598145} +11/06/2021 22:40:39 - INFO - __main__ - Step 10299: {'lr': 0.0004961317900607138, 'samples': 1977408, 'steps': 10298, 'loss/train': 2.788236141204834} +11/06/2021 22:40:39 - INFO - __main__ - Step 10300: {'lr': 0.0004961308600935807, 'samples': 1977600, 'steps': 10299, 'loss/train': 1.8009984493255615} +11/06/2021 22:40:39 - INFO - __main__ - Step 10301: {'lr': 0.0004961299300155446, 'samples': 1977792, 'steps': 10300, 'loss/train': 1.9995626211166382} +11/06/2021 22:40:40 - INFO - __main__ - Step 10302: {'lr': 0.0004961289998266064, 'samples': 1977984, 'steps': 10301, 'loss/train': 1.1890935897827148} +11/06/2021 22:40:41 - INFO - __main__ - Step 10303: {'lr': 0.0004961280695267662, 'samples': 1978176, 'steps': 10302, 'loss/train': 1.4275264739990234} +11/06/2021 22:40:41 - INFO - __main__ - Step 10304: {'lr': 0.0004961271391160243, 'samples': 1978368, 'steps': 10303, 'loss/train': 1.8430927991867065} +11/06/2021 22:40:41 - INFO - __main__ - Step 10305: {'lr': 0.0004961262085943815, 'samples': 1978560, 'steps': 10304, 'loss/train': 1.3772211074829102} +11/06/2021 22:40:42 - INFO - __main__ - Step 10306: {'lr': 0.000496125277961838, 'samples': 1978752, 'steps': 10305, 'loss/train': 1.3290560245513916} +11/06/2021 22:40:43 - INFO - __main__ - Step 10307: {'lr': 0.0004961243472183942, 'samples': 1978944, 'steps': 10306, 'loss/train': 1.4642337560653687} +11/06/2021 22:40:43 - INFO - __main__ - Step 10308: {'lr': 0.0004961234163640507, 'samples': 1979136, 'steps': 10307, 'loss/train': 1.9507293701171875} +11/06/2021 22:40:43 - INFO - __main__ - Step 10309: {'lr': 0.0004961224853988076, 'samples': 1979328, 'steps': 10308, 'loss/train': 2.0494842529296875} +11/06/2021 22:40:44 - INFO - __main__ - Step 10310: {'lr': 0.0004961215543226657, 'samples': 1979520, 'steps': 10309, 'loss/train': 1.839885950088501} +11/06/2021 22:40:44 - INFO - __main__ - Step 10311: {'lr': 0.0004961206231356251, 'samples': 1979712, 'steps': 10310, 'loss/train': 1.5155304670333862} +11/06/2021 22:40:45 - INFO - __main__ - Step 10312: {'lr': 0.0004961196918376864, 'samples': 1979904, 'steps': 10311, 'loss/train': 1.361377239227295} +11/06/2021 22:40:46 - INFO - __main__ - Step 10313: {'lr': 0.0004961187604288498, 'samples': 1980096, 'steps': 10312, 'loss/train': 1.2928553819656372} +11/06/2021 22:40:46 - INFO - __main__ - Step 10314: {'lr': 0.0004961178289091161, 'samples': 1980288, 'steps': 10313, 'loss/train': 1.8654111623764038} +11/06/2021 22:40:46 - INFO - __main__ - Step 10315: {'lr': 0.0004961168972784855, 'samples': 1980480, 'steps': 10314, 'loss/train': 1.5969183444976807} +11/06/2021 22:40:47 - INFO - __main__ - Step 10316: {'lr': 0.0004961159655369582, 'samples': 1980672, 'steps': 10315, 'loss/train': 1.5698388814926147} +11/06/2021 22:40:48 - INFO - __main__ - Step 10317: {'lr': 0.0004961150336845351, 'samples': 1980864, 'steps': 10316, 'loss/train': 1.988451600074768} +11/06/2021 22:40:48 - INFO - __main__ - Step 10318: {'lr': 0.0004961141017212162, 'samples': 1981056, 'steps': 10317, 'loss/train': 1.8295103311538696} +11/06/2021 22:40:48 - INFO - __main__ - Step 10319: {'lr': 0.0004961131696470021, 'samples': 1981248, 'steps': 10318, 'loss/train': 1.9807548522949219} +11/06/2021 22:40:49 - INFO - __main__ - Step 10320: {'lr': 0.0004961122374618933, 'samples': 1981440, 'steps': 10319, 'loss/train': 1.6604183912277222} +11/06/2021 22:40:49 - INFO - __main__ - Step 10321: {'lr': 0.00049611130516589, 'samples': 1981632, 'steps': 10320, 'loss/train': 1.369404911994934} +11/06/2021 22:40:49 - INFO - __main__ - Step 10322: {'lr': 0.0004961103727589929, 'samples': 1981824, 'steps': 10321, 'loss/train': 1.0568779706954956} +11/06/2021 22:40:50 - INFO - __main__ - Step 10323: {'lr': 0.0004961094402412021, 'samples': 1982016, 'steps': 10322, 'loss/train': 1.5058151483535767} +11/06/2021 22:40:51 - INFO - __main__ - Step 10324: {'lr': 0.0004961085076125182, 'samples': 1982208, 'steps': 10323, 'loss/train': 1.933563470840454} +11/06/2021 22:40:51 - INFO - __main__ - Step 10325: {'lr': 0.0004961075748729418, 'samples': 1982400, 'steps': 10324, 'loss/train': 1.765858769416809} +11/06/2021 22:40:51 - INFO - __main__ - Step 10326: {'lr': 0.0004961066420224729, 'samples': 1982592, 'steps': 10325, 'loss/train': 1.309130072593689} +11/06/2021 22:40:52 - INFO - __main__ - Step 10327: {'lr': 0.0004961057090611123, 'samples': 1982784, 'steps': 10326, 'loss/train': 1.8366987705230713} +11/06/2021 22:40:53 - INFO - __main__ - Step 10328: {'lr': 0.0004961047759888601, 'samples': 1982976, 'steps': 10327, 'loss/train': 1.7899473905563354} +11/06/2021 22:40:53 - INFO - __main__ - Step 10329: {'lr': 0.000496103842805717, 'samples': 1983168, 'steps': 10328, 'loss/train': 1.4649665355682373} +11/06/2021 22:40:54 - INFO - __main__ - Step 10330: {'lr': 0.0004961029095116833, 'samples': 1983360, 'steps': 10329, 'loss/train': 2.0712430477142334} +11/06/2021 22:40:54 - INFO - __main__ - Step 10331: {'lr': 0.0004961019761067594, 'samples': 1983552, 'steps': 10330, 'loss/train': 2.5029542446136475} +11/06/2021 22:40:54 - INFO - __main__ - Step 10332: {'lr': 0.0004961010425909458, 'samples': 1983744, 'steps': 10331, 'loss/train': 2.1280171871185303} +11/06/2021 22:40:55 - INFO - __main__ - Step 10333: {'lr': 0.0004961001089642428, 'samples': 1983936, 'steps': 10332, 'loss/train': 1.8614065647125244} +11/06/2021 22:40:56 - INFO - __main__ - Step 10334: {'lr': 0.000496099175226651, 'samples': 1984128, 'steps': 10333, 'loss/train': 2.124863862991333} +11/06/2021 22:40:56 - INFO - __main__ - Step 10335: {'lr': 0.0004960982413781705, 'samples': 1984320, 'steps': 10334, 'loss/train': 1.0853912830352783} +11/06/2021 22:40:56 - INFO - __main__ - Step 10336: {'lr': 0.0004960973074188021, 'samples': 1984512, 'steps': 10335, 'loss/train': 1.535399317741394} +11/06/2021 22:40:57 - INFO - __main__ - Step 10337: {'lr': 0.000496096373348546, 'samples': 1984704, 'steps': 10336, 'loss/train': 1.792807936668396} +11/06/2021 22:40:58 - INFO - __main__ - Step 10338: {'lr': 0.0004960954391674026, 'samples': 1984896, 'steps': 10337, 'loss/train': 1.693973183631897} +11/06/2021 22:40:58 - INFO - __main__ - Step 10339: {'lr': 0.0004960945048753725, 'samples': 1985088, 'steps': 10338, 'loss/train': 2.293344020843506} +11/06/2021 22:40:58 - INFO - __main__ - Step 10340: {'lr': 0.000496093570472456, 'samples': 1985280, 'steps': 10339, 'loss/train': 1.3442373275756836} +11/06/2021 22:40:59 - INFO - __main__ - Step 10341: {'lr': 0.0004960926359586535, 'samples': 1985472, 'steps': 10340, 'loss/train': 1.554911732673645} +11/06/2021 22:40:59 - INFO - __main__ - Step 10342: {'lr': 0.0004960917013339656, 'samples': 1985664, 'steps': 10341, 'loss/train': 2.2928225994110107} +11/06/2021 22:41:00 - INFO - __main__ - Step 10343: {'lr': 0.0004960907665983923, 'samples': 1985856, 'steps': 10342, 'loss/train': 1.8382941484451294} +11/06/2021 22:41:00 - INFO - __main__ - Step 10344: {'lr': 0.0004960898317519345, 'samples': 1986048, 'steps': 10343, 'loss/train': 1.9304149150848389} +11/06/2021 22:41:01 - INFO - __main__ - Step 10345: {'lr': 0.0004960888967945924, 'samples': 1986240, 'steps': 10344, 'loss/train': 1.7264574766159058} +11/06/2021 22:41:01 - INFO - __main__ - Step 10346: {'lr': 0.0004960879617263664, 'samples': 1986432, 'steps': 10345, 'loss/train': 1.2233792543411255} +11/06/2021 22:41:02 - INFO - __main__ - Step 10347: {'lr': 0.000496087026547257, 'samples': 1986624, 'steps': 10346, 'loss/train': 1.9374359846115112} +11/06/2021 22:41:02 - INFO - __main__ - Step 10348: {'lr': 0.0004960860912572645, 'samples': 1986816, 'steps': 10347, 'loss/train': 1.7407712936401367} +11/06/2021 22:41:03 - INFO - __main__ - Step 10349: {'lr': 0.0004960851558563895, 'samples': 1987008, 'steps': 10348, 'loss/train': 1.7582014799118042} +11/06/2021 22:41:04 - INFO - __main__ - Step 10350: {'lr': 0.0004960842203446322, 'samples': 1987200, 'steps': 10349, 'loss/train': 0.7253603935241699} +11/06/2021 22:41:04 - INFO - __main__ - Step 10351: {'lr': 0.0004960832847219933, 'samples': 1987392, 'steps': 10350, 'loss/train': 1.7652232646942139} +11/06/2021 22:41:04 - INFO - __main__ - Step 10352: {'lr': 0.000496082348988473, 'samples': 1987584, 'steps': 10351, 'loss/train': 1.9226405620574951} +11/06/2021 22:41:05 - INFO - __main__ - Step 10353: {'lr': 0.0004960814131440717, 'samples': 1987776, 'steps': 10352, 'loss/train': 2.1182456016540527} +11/06/2021 22:41:06 - INFO - __main__ - Step 10354: {'lr': 0.0004960804771887901, 'samples': 1987968, 'steps': 10353, 'loss/train': 1.939481496810913} +11/06/2021 22:41:06 - INFO - __main__ - Step 10355: {'lr': 0.0004960795411226283, 'samples': 1988160, 'steps': 10354, 'loss/train': 2.0060768127441406} +11/06/2021 22:41:06 - INFO - __main__ - Step 10356: {'lr': 0.0004960786049455868, 'samples': 1988352, 'steps': 10355, 'loss/train': 1.5645967721939087} +11/06/2021 22:41:07 - INFO - __main__ - Step 10357: {'lr': 0.0004960776686576663, 'samples': 1988544, 'steps': 10356, 'loss/train': 1.7053444385528564} +11/06/2021 22:41:07 - INFO - __main__ - Step 10358: {'lr': 0.0004960767322588668, 'samples': 1988736, 'steps': 10357, 'loss/train': 1.8968679904937744} +11/06/2021 22:41:08 - INFO - __main__ - Step 10359: {'lr': 0.000496075795749189, 'samples': 1988928, 'steps': 10358, 'loss/train': 1.6383986473083496} +11/06/2021 22:41:08 - INFO - __main__ - Step 10360: {'lr': 0.0004960748591286332, 'samples': 1989120, 'steps': 10359, 'loss/train': 2.3410348892211914} +11/06/2021 22:41:09 - INFO - __main__ - Step 10361: {'lr': 0.0004960739223971999, 'samples': 1989312, 'steps': 10360, 'loss/train': 2.367793560028076} +11/06/2021 22:41:09 - INFO - __main__ - Step 10362: {'lr': 0.0004960729855548895, 'samples': 1989504, 'steps': 10361, 'loss/train': 1.650147795677185} +11/06/2021 22:41:10 - INFO - __main__ - Step 10363: {'lr': 0.0004960720486017025, 'samples': 1989696, 'steps': 10362, 'loss/train': 0.8240565657615662} +11/06/2021 22:41:11 - INFO - __main__ - Step 10364: {'lr': 0.0004960711115376391, 'samples': 1989888, 'steps': 10363, 'loss/train': 2.253253698348999} +11/06/2021 22:41:11 - INFO - __main__ - Step 10365: {'lr': 0.0004960701743626999, 'samples': 1990080, 'steps': 10364, 'loss/train': 1.3892946243286133} +11/06/2021 22:41:11 - INFO - __main__ - Step 10366: {'lr': 0.0004960692370768853, 'samples': 1990272, 'steps': 10365, 'loss/train': 1.6433247327804565} +11/06/2021 22:41:12 - INFO - __main__ - Step 10367: {'lr': 0.0004960682996801956, 'samples': 1990464, 'steps': 10366, 'loss/train': 1.6244982481002808} +11/06/2021 22:41:12 - INFO - __main__ - Step 10368: {'lr': 0.0004960673621726314, 'samples': 1990656, 'steps': 10367, 'loss/train': 1.839497685432434} +11/06/2021 22:41:13 - INFO - __main__ - Step 10369: {'lr': 0.000496066424554193, 'samples': 1990848, 'steps': 10368, 'loss/train': 1.401164174079895} +11/06/2021 22:41:14 - INFO - __main__ - Step 10370: {'lr': 0.0004960654868248809, 'samples': 1991040, 'steps': 10369, 'loss/train': 2.057040214538574} +11/06/2021 22:41:14 - INFO - __main__ - Step 10371: {'lr': 0.0004960645489846955, 'samples': 1991232, 'steps': 10370, 'loss/train': 2.0657546520233154} +11/06/2021 22:41:14 - INFO - __main__ - Step 10372: {'lr': 0.0004960636110336371, 'samples': 1991424, 'steps': 10371, 'loss/train': 1.8819034099578857} +11/06/2021 22:41:15 - INFO - __main__ - Step 10373: {'lr': 0.0004960626729717064, 'samples': 1991616, 'steps': 10372, 'loss/train': 1.3991193771362305} +11/06/2021 22:41:15 - INFO - __main__ - Step 10374: {'lr': 0.0004960617347989036, 'samples': 1991808, 'steps': 10373, 'loss/train': 1.9511737823486328} +11/06/2021 22:41:17 - INFO - __main__ - Step 10375: {'lr': 0.0004960607965152292, 'samples': 1992000, 'steps': 10374, 'loss/train': 1.4117087125778198} +11/06/2021 22:41:17 - INFO - __main__ - Step 10376: {'lr': 0.0004960598581206835, 'samples': 1992192, 'steps': 10375, 'loss/train': 1.0104448795318604} +11/06/2021 22:41:18 - INFO - __main__ - Step 10377: {'lr': 0.000496058919615267, 'samples': 1992384, 'steps': 10376, 'loss/train': 1.3164684772491455} +11/06/2021 22:41:18 - INFO - __main__ - Step 10378: {'lr': 0.0004960579809989803, 'samples': 1992576, 'steps': 10377, 'loss/train': 1.1793992519378662} +11/06/2021 22:41:19 - INFO - __main__ - Step 10379: {'lr': 0.0004960570422718237, 'samples': 1992768, 'steps': 10378, 'loss/train': 0.8159379959106445} +11/06/2021 22:41:19 - INFO - __main__ - Step 10380: {'lr': 0.0004960561034337975, 'samples': 1992960, 'steps': 10379, 'loss/train': 2.050475835800171} +11/06/2021 22:41:19 - INFO - __main__ - Step 10381: {'lr': 0.0004960551644849022, 'samples': 1993152, 'steps': 10380, 'loss/train': 1.5734912157058716} +11/06/2021 22:41:20 - INFO - __main__ - Step 10382: {'lr': 0.0004960542254251382, 'samples': 1993344, 'steps': 10381, 'loss/train': 1.4547319412231445} +11/06/2021 22:41:21 - INFO - __main__ - Step 10383: {'lr': 0.0004960532862545061, 'samples': 1993536, 'steps': 10382, 'loss/train': 1.9347224235534668} +11/06/2021 22:41:21 - INFO - __main__ - Step 10384: {'lr': 0.0004960523469730061, 'samples': 1993728, 'steps': 10383, 'loss/train': 1.8350725173950195} +11/06/2021 22:41:21 - INFO - __main__ - Step 10385: {'lr': 0.0004960514075806387, 'samples': 1993920, 'steps': 10384, 'loss/train': 2.118435859680176} +11/06/2021 22:41:22 - INFO - __main__ - Step 10386: {'lr': 0.0004960504680774043, 'samples': 1994112, 'steps': 10385, 'loss/train': 1.8689095973968506} +11/06/2021 22:41:23 - INFO - __main__ - Step 10387: {'lr': 0.0004960495284633034, 'samples': 1994304, 'steps': 10386, 'loss/train': 0.7011041045188904} +11/06/2021 22:41:23 - INFO - __main__ - Step 10388: {'lr': 0.0004960485887383363, 'samples': 1994496, 'steps': 10387, 'loss/train': 1.9033364057540894} +11/06/2021 22:41:23 - INFO - __main__ - Step 10389: {'lr': 0.0004960476489025037, 'samples': 1994688, 'steps': 10388, 'loss/train': 1.7955809831619263} +11/06/2021 22:41:24 - INFO - __main__ - Step 10390: {'lr': 0.0004960467089558057, 'samples': 1994880, 'steps': 10389, 'loss/train': 1.9313750267028809} +11/06/2021 22:41:24 - INFO - __main__ - Step 10391: {'lr': 0.0004960457688982428, 'samples': 1995072, 'steps': 10390, 'loss/train': 1.3544516563415527} +11/06/2021 22:41:25 - INFO - __main__ - Step 10392: {'lr': 0.0004960448287298156, 'samples': 1995264, 'steps': 10391, 'loss/train': 1.409073829650879} +11/06/2021 22:41:26 - INFO - __main__ - Step 10393: {'lr': 0.0004960438884505242, 'samples': 1995456, 'steps': 10392, 'loss/train': 1.8170816898345947} +11/06/2021 22:41:26 - INFO - __main__ - Step 10394: {'lr': 0.0004960429480603694, 'samples': 1995648, 'steps': 10393, 'loss/train': 1.6994777917861938} +11/06/2021 22:41:26 - INFO - __main__ - Step 10395: {'lr': 0.0004960420075593515, 'samples': 1995840, 'steps': 10394, 'loss/train': 1.7487272024154663} +11/06/2021 22:41:27 - INFO - __main__ - Step 10396: {'lr': 0.0004960410669474708, 'samples': 1996032, 'steps': 10395, 'loss/train': 1.8390122652053833} +11/06/2021 22:41:28 - INFO - __main__ - Step 10397: {'lr': 0.0004960401262247277, 'samples': 1996224, 'steps': 10396, 'loss/train': 1.0365424156188965} +11/06/2021 22:41:28 - INFO - __main__ - Step 10398: {'lr': 0.0004960391853911228, 'samples': 1996416, 'steps': 10397, 'loss/train': 1.6385880708694458} +11/06/2021 22:41:29 - INFO - __main__ - Step 10399: {'lr': 0.0004960382444466564, 'samples': 1996608, 'steps': 10398, 'loss/train': 1.1302746534347534} +11/06/2021 22:41:29 - INFO - __main__ - Step 10400: {'lr': 0.0004960373033913289, 'samples': 1996800, 'steps': 10399, 'loss/train': 1.6192007064819336} +11/06/2021 22:41:29 - INFO - __main__ - Step 10401: {'lr': 0.0004960363622251409, 'samples': 1996992, 'steps': 10400, 'loss/train': 1.7356743812561035} +11/06/2021 22:41:30 - INFO - __main__ - Step 10402: {'lr': 0.0004960354209480927, 'samples': 1997184, 'steps': 10401, 'loss/train': 1.772154688835144} +11/06/2021 22:41:31 - INFO - __main__ - Step 10403: {'lr': 0.0004960344795601847, 'samples': 1997376, 'steps': 10402, 'loss/train': 2.327993869781494} +11/06/2021 22:41:31 - INFO - __main__ - Step 10404: {'lr': 0.0004960335380614174, 'samples': 1997568, 'steps': 10403, 'loss/train': 1.9825865030288696} +11/06/2021 22:41:31 - INFO - __main__ - Step 10405: {'lr': 0.0004960325964517912, 'samples': 1997760, 'steps': 10404, 'loss/train': 1.8894060850143433} +11/06/2021 22:41:32 - INFO - __main__ - Step 10406: {'lr': 0.0004960316547313064, 'samples': 1997952, 'steps': 10405, 'loss/train': 1.8726656436920166} +11/06/2021 22:41:33 - INFO - __main__ - Step 10407: {'lr': 0.0004960307128999636, 'samples': 1998144, 'steps': 10406, 'loss/train': 1.447789192199707} +11/06/2021 22:41:33 - INFO - __main__ - Step 10408: {'lr': 0.0004960297709577632, 'samples': 1998336, 'steps': 10407, 'loss/train': 2.224510431289673} +11/06/2021 22:41:34 - INFO - __main__ - Step 10409: {'lr': 0.0004960288289047054, 'samples': 1998528, 'steps': 10408, 'loss/train': 1.373806118965149} +11/06/2021 22:41:34 - INFO - __main__ - Step 10410: {'lr': 0.000496027886740791, 'samples': 1998720, 'steps': 10409, 'loss/train': 1.4621202945709229} +11/06/2021 22:41:34 - INFO - __main__ - Step 10411: {'lr': 0.0004960269444660201, 'samples': 1998912, 'steps': 10410, 'loss/train': 1.9223895072937012} +11/06/2021 22:41:35 - INFO - __main__ - Step 10412: {'lr': 0.0004960260020803934, 'samples': 1999104, 'steps': 10411, 'loss/train': 1.9031519889831543} +11/06/2021 22:41:36 - INFO - __main__ - Step 10413: {'lr': 0.0004960250595839111, 'samples': 1999296, 'steps': 10412, 'loss/train': 1.6633156538009644} +11/06/2021 22:41:36 - INFO - __main__ - Step 10414: {'lr': 0.0004960241169765737, 'samples': 1999488, 'steps': 10413, 'loss/train': 1.947817087173462} +11/06/2021 22:41:36 - INFO - __main__ - Step 10415: {'lr': 0.0004960231742583817, 'samples': 1999680, 'steps': 10414, 'loss/train': 1.6474344730377197} +11/06/2021 22:41:37 - INFO - __main__ - Step 10416: {'lr': 0.0004960222314293354, 'samples': 1999872, 'steps': 10415, 'loss/train': 1.6221576929092407} +11/06/2021 22:41:37 - INFO - __main__ - Step 10417: {'lr': 0.0004960212884894353, 'samples': 2000064, 'steps': 10416, 'loss/train': 1.5149108171463013} +11/06/2021 22:41:38 - INFO - __main__ - Step 10418: {'lr': 0.0004960203454386817, 'samples': 2000256, 'steps': 10417, 'loss/train': 0.9100244641304016} +11/06/2021 22:41:38 - INFO - __main__ - Step 10419: {'lr': 0.0004960194022770753, 'samples': 2000448, 'steps': 10418, 'loss/train': 1.549153447151184} +11/06/2021 22:41:39 - INFO - __main__ - Step 10420: {'lr': 0.0004960184590046162, 'samples': 2000640, 'steps': 10419, 'loss/train': 1.8034104108810425} +11/06/2021 22:41:39 - INFO - __main__ - Step 10421: {'lr': 0.0004960175156213051, 'samples': 2000832, 'steps': 10420, 'loss/train': 0.9687737226486206} +11/06/2021 22:41:39 - INFO - __main__ - Step 10422: {'lr': 0.0004960165721271422, 'samples': 2001024, 'steps': 10421, 'loss/train': 1.8846495151519775} +11/06/2021 22:41:41 - INFO - __main__ - Step 10423: {'lr': 0.000496015628522128, 'samples': 2001216, 'steps': 10422, 'loss/train': 1.9125192165374756} +11/06/2021 22:41:41 - INFO - __main__ - Step 10424: {'lr': 0.000496014684806263, 'samples': 2001408, 'steps': 10423, 'loss/train': 1.8119043111801147} +11/06/2021 22:41:41 - INFO - __main__ - Step 10425: {'lr': 0.0004960137409795477, 'samples': 2001600, 'steps': 10424, 'loss/train': 2.1726603507995605} +11/06/2021 22:41:42 - INFO - __main__ - Step 10426: {'lr': 0.0004960127970419822, 'samples': 2001792, 'steps': 10425, 'loss/train': 1.9231642484664917} +11/06/2021 22:41:42 - INFO - __main__ - Step 10427: {'lr': 0.0004960118529935674, 'samples': 2001984, 'steps': 10426, 'loss/train': 2.1175436973571777} +11/06/2021 22:41:43 - INFO - __main__ - Step 10428: {'lr': 0.0004960109088343032, 'samples': 2002176, 'steps': 10427, 'loss/train': 2.0986135005950928} +11/06/2021 22:41:43 - INFO - __main__ - Step 10429: {'lr': 0.0004960099645641903, 'samples': 2002368, 'steps': 10428, 'loss/train': 1.7129641771316528} +11/06/2021 22:41:44 - INFO - __main__ - Step 10430: {'lr': 0.0004960090201832293, 'samples': 2002560, 'steps': 10429, 'loss/train': 1.1784454584121704} +11/06/2021 22:41:44 - INFO - __main__ - Step 10431: {'lr': 0.0004960080756914203, 'samples': 2002752, 'steps': 10430, 'loss/train': 1.253516674041748} +11/06/2021 22:41:44 - INFO - __main__ - Step 10432: {'lr': 0.0004960071310887638, 'samples': 2002944, 'steps': 10431, 'loss/train': 1.8971530199050903} +11/06/2021 22:41:45 - INFO - __main__ - Step 10433: {'lr': 0.0004960061863752604, 'samples': 2003136, 'steps': 10432, 'loss/train': 2.065613031387329} +11/06/2021 22:41:46 - INFO - __main__ - Step 10434: {'lr': 0.0004960052415509103, 'samples': 2003328, 'steps': 10433, 'loss/train': 1.7110601663589478} +11/06/2021 22:41:46 - INFO - __main__ - Step 10435: {'lr': 0.0004960042966157141, 'samples': 2003520, 'steps': 10434, 'loss/train': 1.3858282566070557} +11/06/2021 22:41:47 - INFO - __main__ - Step 10436: {'lr': 0.0004960033515696722, 'samples': 2003712, 'steps': 10435, 'loss/train': 1.303482174873352} +11/06/2021 22:41:47 - INFO - __main__ - Step 10437: {'lr': 0.0004960024064127849, 'samples': 2003904, 'steps': 10436, 'loss/train': 1.2062408924102783} +11/06/2021 22:41:47 - INFO - __main__ - Step 10438: {'lr': 0.0004960014611450527, 'samples': 2004096, 'steps': 10437, 'loss/train': 1.7718604803085327} +11/06/2021 22:41:48 - INFO - __main__ - Step 10439: {'lr': 0.0004960005157664762, 'samples': 2004288, 'steps': 10438, 'loss/train': 1.6597301959991455} +11/06/2021 22:41:49 - INFO - __main__ - Step 10440: {'lr': 0.0004959995702770555, 'samples': 2004480, 'steps': 10439, 'loss/train': 1.9467318058013916} +11/06/2021 22:41:49 - INFO - __main__ - Step 10441: {'lr': 0.0004959986246767913, 'samples': 2004672, 'steps': 10440, 'loss/train': 2.24183988571167} +11/06/2021 22:41:49 - INFO - __main__ - Step 10442: {'lr': 0.0004959976789656838, 'samples': 2004864, 'steps': 10441, 'loss/train': 1.8617457151412964} +11/06/2021 22:41:50 - INFO - __main__ - Step 10443: {'lr': 0.0004959967331437336, 'samples': 2005056, 'steps': 10442, 'loss/train': 2.394559621810913} +11/06/2021 22:41:51 - INFO - __main__ - Step 10444: {'lr': 0.0004959957872109411, 'samples': 2005248, 'steps': 10443, 'loss/train': 2.127652168273926} +11/06/2021 22:41:51 - INFO - __main__ - Step 10445: {'lr': 0.0004959948411673066, 'samples': 2005440, 'steps': 10444, 'loss/train': 1.733871579170227} +11/06/2021 22:41:51 - INFO - __main__ - Step 10446: {'lr': 0.0004959938950128308, 'samples': 2005632, 'steps': 10445, 'loss/train': 1.8825232982635498} +11/06/2021 22:41:52 - INFO - __main__ - Step 10447: {'lr': 0.0004959929487475138, 'samples': 2005824, 'steps': 10446, 'loss/train': 1.3970377445220947} +11/06/2021 22:41:52 - INFO - __main__ - Step 10448: {'lr': 0.0004959920023713563, 'samples': 2006016, 'steps': 10447, 'loss/train': 1.3850414752960205} +11/06/2021 22:41:52 - INFO - __main__ - Step 10449: {'lr': 0.0004959910558843584, 'samples': 2006208, 'steps': 10448, 'loss/train': 1.893357753753662} +11/06/2021 22:41:54 - INFO - __main__ - Step 10450: {'lr': 0.0004959901092865208, 'samples': 2006400, 'steps': 10449, 'loss/train': 1.3027065992355347} +11/06/2021 22:41:54 - INFO - __main__ - Step 10451: {'lr': 0.0004959891625778438, 'samples': 2006592, 'steps': 10450, 'loss/train': 2.1753814220428467} +11/06/2021 22:41:54 - INFO - __main__ - Step 10452: {'lr': 0.0004959882157583281, 'samples': 2006784, 'steps': 10451, 'loss/train': 1.65367591381073} +11/06/2021 22:41:55 - INFO - __main__ - Step 10453: {'lr': 0.0004959872688279737, 'samples': 2006976, 'steps': 10452, 'loss/train': 1.8160592317581177} +11/06/2021 22:41:55 - INFO - __main__ - Step 10454: {'lr': 0.0004959863217867814, 'samples': 2007168, 'steps': 10453, 'loss/train': 1.6027116775512695} +11/06/2021 22:41:56 - INFO - __main__ - Step 10455: {'lr': 0.0004959853746347513, 'samples': 2007360, 'steps': 10454, 'loss/train': 1.9197403192520142} +11/06/2021 22:41:57 - INFO - __main__ - Step 10456: {'lr': 0.0004959844273718841, 'samples': 2007552, 'steps': 10455, 'loss/train': 1.6267117261886597} +11/06/2021 22:41:57 - INFO - __main__ - Step 10457: {'lr': 0.00049598347999818, 'samples': 2007744, 'steps': 10456, 'loss/train': 1.6874116659164429} +11/06/2021 22:41:58 - INFO - __main__ - Step 10458: {'lr': 0.0004959825325136396, 'samples': 2007936, 'steps': 10457, 'loss/train': 1.9572356939315796} +11/06/2021 22:41:58 - INFO - __main__ - Step 10459: {'lr': 0.0004959815849182633, 'samples': 2008128, 'steps': 10458, 'loss/train': 1.2736876010894775} +11/06/2021 22:41:58 - INFO - __main__ - Step 10460: {'lr': 0.0004959806372120515, 'samples': 2008320, 'steps': 10459, 'loss/train': 1.9439113140106201} +11/06/2021 22:41:59 - INFO - __main__ - Step 10461: {'lr': 0.0004959796893950045, 'samples': 2008512, 'steps': 10460, 'loss/train': 2.2238245010375977} +11/06/2021 22:42:00 - INFO - __main__ - Step 10462: {'lr': 0.0004959787414671229, 'samples': 2008704, 'steps': 10461, 'loss/train': 1.8460416793823242} +11/06/2021 22:42:00 - INFO - __main__ - Step 10463: {'lr': 0.000495977793428407, 'samples': 2008896, 'steps': 10462, 'loss/train': 1.9288679361343384} +11/06/2021 22:42:00 - INFO - __main__ - Step 10464: {'lr': 0.0004959768452788575, 'samples': 2009088, 'steps': 10463, 'loss/train': 1.7732502222061157} +11/06/2021 22:42:01 - INFO - __main__ - Step 10465: {'lr': 0.0004959758970184745, 'samples': 2009280, 'steps': 10464, 'loss/train': 2.398732900619507} +11/06/2021 22:42:02 - INFO - __main__ - Step 10466: {'lr': 0.0004959749486472587, 'samples': 2009472, 'steps': 10465, 'loss/train': 1.7253568172454834} +11/06/2021 22:42:02 - INFO - __main__ - Step 10467: {'lr': 0.0004959740001652102, 'samples': 2009664, 'steps': 10466, 'loss/train': 1.70595121383667} +11/06/2021 22:42:02 - INFO - __main__ - Step 10468: {'lr': 0.0004959730515723298, 'samples': 2009856, 'steps': 10467, 'loss/train': 1.9712741374969482} +11/06/2021 22:42:03 - INFO - __main__ - Step 10469: {'lr': 0.0004959721028686175, 'samples': 2010048, 'steps': 10468, 'loss/train': 1.4620518684387207} +11/06/2021 22:42:03 - INFO - __main__ - Step 10470: {'lr': 0.0004959711540540741, 'samples': 2010240, 'steps': 10469, 'loss/train': 1.9116092920303345} +11/06/2021 22:42:04 - INFO - __main__ - Step 10471: {'lr': 0.0004959702051286999, 'samples': 2010432, 'steps': 10470, 'loss/train': 2.0080511569976807} +11/06/2021 22:42:04 - INFO - __main__ - Step 10472: {'lr': 0.0004959692560924954, 'samples': 2010624, 'steps': 10471, 'loss/train': 1.8201708793640137} +11/06/2021 22:42:05 - INFO - __main__ - Step 10473: {'lr': 0.0004959683069454608, 'samples': 2010816, 'steps': 10472, 'loss/train': 1.4937697649002075} +11/06/2021 22:42:05 - INFO - __main__ - Step 10474: {'lr': 0.0004959673576875967, 'samples': 2011008, 'steps': 10473, 'loss/train': 1.4996908903121948} +11/06/2021 22:42:06 - INFO - __main__ - Step 10475: {'lr': 0.0004959664083189035, 'samples': 2011200, 'steps': 10474, 'loss/train': 1.8766359090805054} +11/06/2021 22:42:07 - INFO - __main__ - Step 10476: {'lr': 0.0004959654588393818, 'samples': 2011392, 'steps': 10475, 'loss/train': 2.539846181869507} +11/06/2021 22:42:07 - INFO - __main__ - Step 10477: {'lr': 0.0004959645092490316, 'samples': 2011584, 'steps': 10476, 'loss/train': 2.0664992332458496} +11/06/2021 22:42:07 - INFO - __main__ - Step 10478: {'lr': 0.0004959635595478537, 'samples': 2011776, 'steps': 10477, 'loss/train': 2.1357581615448} +11/06/2021 22:42:08 - INFO - __main__ - Step 10479: {'lr': 0.0004959626097358485, 'samples': 2011968, 'steps': 10478, 'loss/train': 1.7041106224060059} +11/06/2021 22:42:08 - INFO - __main__ - Step 10480: {'lr': 0.0004959616598130162, 'samples': 2012160, 'steps': 10479, 'loss/train': 1.5367162227630615} +11/06/2021 22:42:09 - INFO - __main__ - Step 10481: {'lr': 0.0004959607097793575, 'samples': 2012352, 'steps': 10480, 'loss/train': 0.8361077904701233} +11/06/2021 22:42:09 - INFO - __main__ - Step 10482: {'lr': 0.0004959597596348726, 'samples': 2012544, 'steps': 10481, 'loss/train': 1.425622582435608} +11/06/2021 22:42:10 - INFO - __main__ - Step 10483: {'lr': 0.0004959588093795621, 'samples': 2012736, 'steps': 10482, 'loss/train': 1.8034032583236694} +11/06/2021 22:42:10 - INFO - __main__ - Step 10484: {'lr': 0.0004959578590134262, 'samples': 2012928, 'steps': 10483, 'loss/train': 1.7551143169403076} +11/06/2021 22:42:10 - INFO - __main__ - Step 10485: {'lr': 0.0004959569085364657, 'samples': 2013120, 'steps': 10484, 'loss/train': 1.8540403842926025} +11/06/2021 22:42:11 - INFO - __main__ - Step 10486: {'lr': 0.0004959559579486807, 'samples': 2013312, 'steps': 10485, 'loss/train': 1.9935126304626465} +11/06/2021 22:42:12 - INFO - __main__ - Step 10487: {'lr': 0.0004959550072500718, 'samples': 2013504, 'steps': 10486, 'loss/train': 1.6862492561340332} +11/06/2021 22:42:12 - INFO - __main__ - Step 10488: {'lr': 0.0004959540564406393, 'samples': 2013696, 'steps': 10487, 'loss/train': 1.781096339225769} +11/06/2021 22:42:12 - INFO - __main__ - Step 10489: {'lr': 0.0004959531055203837, 'samples': 2013888, 'steps': 10488, 'loss/train': 1.8593416213989258} +11/06/2021 22:42:13 - INFO - __main__ - Step 10490: {'lr': 0.0004959521544893055, 'samples': 2014080, 'steps': 10489, 'loss/train': 1.739823579788208} +11/06/2021 22:42:13 - INFO - __main__ - Step 10491: {'lr': 0.000495951203347405, 'samples': 2014272, 'steps': 10490, 'loss/train': 1.9146326780319214} +11/06/2021 22:42:14 - INFO - __main__ - Step 10492: {'lr': 0.0004959502520946827, 'samples': 2014464, 'steps': 10491, 'loss/train': 2.1610023975372314} +11/06/2021 22:42:14 - INFO - __main__ - Step 10493: {'lr': 0.000495949300731139, 'samples': 2014656, 'steps': 10492, 'loss/train': 1.6168802976608276} +11/06/2021 22:42:15 - INFO - __main__ - Step 10494: {'lr': 0.0004959483492567744, 'samples': 2014848, 'steps': 10493, 'loss/train': 1.6835715770721436} +11/06/2021 22:42:15 - INFO - __main__ - Step 10495: {'lr': 0.0004959473976715892, 'samples': 2015040, 'steps': 10494, 'loss/train': 1.6348047256469727} +11/06/2021 22:42:15 - INFO - __main__ - Step 10496: {'lr': 0.0004959464459755839, 'samples': 2015232, 'steps': 10495, 'loss/train': 1.2869349718093872} +11/06/2021 22:42:17 - INFO - __main__ - Step 10497: {'lr': 0.0004959454941687589, 'samples': 2015424, 'steps': 10496, 'loss/train': 1.733815312385559} +11/06/2021 22:42:17 - INFO - __main__ - Step 10498: {'lr': 0.0004959445422511148, 'samples': 2015616, 'steps': 10497, 'loss/train': 1.9846241474151611} +11/06/2021 22:42:17 - INFO - __main__ - Step 10499: {'lr': 0.0004959435902226517, 'samples': 2015808, 'steps': 10498, 'loss/train': 0.9969847202301025} +11/06/2021 22:42:18 - INFO - __main__ - Step 10500: {'lr': 0.0004959426380833703, 'samples': 2016000, 'steps': 10499, 'loss/train': 1.6832598447799683} +11/06/2021 22:42:18 - INFO - __main__ - Step 10501: {'lr': 0.0004959416858332709, 'samples': 2016192, 'steps': 10500, 'loss/train': 1.6795216798782349} +11/06/2021 22:42:19 - INFO - __main__ - Step 10502: {'lr': 0.000495940733472354, 'samples': 2016384, 'steps': 10501, 'loss/train': 2.3554139137268066} +11/06/2021 22:42:19 - INFO - __main__ - Step 10503: {'lr': 0.00049593978100062, 'samples': 2016576, 'steps': 10502, 'loss/train': 1.8953803777694702} +11/06/2021 22:42:20 - INFO - __main__ - Step 10504: {'lr': 0.0004959388284180694, 'samples': 2016768, 'steps': 10503, 'loss/train': 2.1253671646118164} +11/06/2021 22:42:20 - INFO - __main__ - Step 10505: {'lr': 0.0004959378757247024, 'samples': 2016960, 'steps': 10504, 'loss/train': 1.8000476360321045} +11/06/2021 22:42:20 - INFO - __main__ - Step 10506: {'lr': 0.0004959369229205197, 'samples': 2017152, 'steps': 10505, 'loss/train': 0.36025920510292053} +11/06/2021 22:42:21 - INFO - __main__ - Step 10507: {'lr': 0.0004959359700055216, 'samples': 2017344, 'steps': 10506, 'loss/train': 1.7624599933624268} +11/06/2021 22:42:22 - INFO - __main__ - Step 10508: {'lr': 0.0004959350169797085, 'samples': 2017536, 'steps': 10507, 'loss/train': 1.786071538925171} +11/06/2021 22:42:22 - INFO - __main__ - Step 10509: {'lr': 0.000495934063843081, 'samples': 2017728, 'steps': 10508, 'loss/train': 2.0693178176879883} +11/06/2021 22:42:23 - INFO - __main__ - Step 10510: {'lr': 0.0004959331105956393, 'samples': 2017920, 'steps': 10509, 'loss/train': 1.65921950340271} +11/06/2021 22:42:23 - INFO - __main__ - Step 10511: {'lr': 0.000495932157237384, 'samples': 2018112, 'steps': 10510, 'loss/train': 1.9849227666854858} +11/06/2021 22:42:23 - INFO - __main__ - Step 10512: {'lr': 0.0004959312037683154, 'samples': 2018304, 'steps': 10511, 'loss/train': 1.6077988147735596} +11/06/2021 22:42:24 - INFO - __main__ - Step 10513: {'lr': 0.0004959302501884341, 'samples': 2018496, 'steps': 10512, 'loss/train': 1.6553412675857544} +11/06/2021 22:42:25 - INFO - __main__ - Step 10514: {'lr': 0.0004959292964977403, 'samples': 2018688, 'steps': 10513, 'loss/train': 1.3393796682357788} +11/06/2021 22:42:25 - INFO - __main__ - Step 10515: {'lr': 0.0004959283426962345, 'samples': 2018880, 'steps': 10514, 'loss/train': 1.1275650262832642} +11/06/2021 22:42:25 - INFO - __main__ - Step 10516: {'lr': 0.0004959273887839175, 'samples': 2019072, 'steps': 10515, 'loss/train': 1.4780120849609375} +11/06/2021 22:42:26 - INFO - __main__ - Step 10517: {'lr': 0.000495926434760789, 'samples': 2019264, 'steps': 10516, 'loss/train': 1.8599119186401367} +11/06/2021 22:42:27 - INFO - __main__ - Step 10518: {'lr': 0.0004959254806268501, 'samples': 2019456, 'steps': 10517, 'loss/train': 1.910403847694397} +11/06/2021 22:42:27 - INFO - __main__ - Step 10519: {'lr': 0.0004959245263821009, 'samples': 2019648, 'steps': 10518, 'loss/train': 1.8654783964157104} +11/06/2021 22:42:27 - INFO - __main__ - Step 10520: {'lr': 0.0004959235720265419, 'samples': 2019840, 'steps': 10519, 'loss/train': 1.3041726350784302} +11/06/2021 22:42:28 - INFO - __main__ - Step 10521: {'lr': 0.0004959226175601736, 'samples': 2020032, 'steps': 10520, 'loss/train': 1.7402362823486328} +11/06/2021 22:42:28 - INFO - __main__ - Step 10522: {'lr': 0.0004959216629829964, 'samples': 2020224, 'steps': 10521, 'loss/train': 1.8779191970825195} +11/06/2021 22:42:29 - INFO - __main__ - Step 10523: {'lr': 0.0004959207082950105, 'samples': 2020416, 'steps': 10522, 'loss/train': 1.9938749074935913} +11/06/2021 22:42:29 - INFO - __main__ - Step 10524: {'lr': 0.0004959197534962166, 'samples': 2020608, 'steps': 10523, 'loss/train': 1.7240444421768188} +11/06/2021 22:42:30 - INFO - __main__ - Step 10525: {'lr': 0.0004959187985866152, 'samples': 2020800, 'steps': 10524, 'loss/train': 1.3333297967910767} +11/06/2021 22:42:30 - INFO - __main__ - Step 10526: {'lr': 0.0004959178435662064, 'samples': 2020992, 'steps': 10525, 'loss/train': 3.172778606414795} +11/06/2021 22:42:30 - INFO - __main__ - Step 10527: {'lr': 0.0004959168884349909, 'samples': 2021184, 'steps': 10526, 'loss/train': 2.005765438079834} +11/06/2021 22:42:32 - INFO - __main__ - Step 10528: {'lr': 0.0004959159331929691, 'samples': 2021376, 'steps': 10527, 'loss/train': 1.9616241455078125} +11/06/2021 22:42:32 - INFO - __main__ - Step 10529: {'lr': 0.0004959149778401412, 'samples': 2021568, 'steps': 10528, 'loss/train': 0.44385576248168945} +11/06/2021 22:42:32 - INFO - __main__ - Step 10530: {'lr': 0.000495914022376508, 'samples': 2021760, 'steps': 10529, 'loss/train': 1.7894715070724487} +11/06/2021 22:42:33 - INFO - __main__ - Step 10531: {'lr': 0.0004959130668020696, 'samples': 2021952, 'steps': 10530, 'loss/train': 1.43883216381073} +11/06/2021 22:42:33 - INFO - __main__ - Step 10532: {'lr': 0.0004959121111168266, 'samples': 2022144, 'steps': 10531, 'loss/train': 1.801062822341919} +11/06/2021 22:42:34 - INFO - __main__ - Step 10533: {'lr': 0.0004959111553207794, 'samples': 2022336, 'steps': 10532, 'loss/train': 1.905466914176941} +11/06/2021 22:42:34 - INFO - __main__ - Step 10534: {'lr': 0.0004959101994139284, 'samples': 2022528, 'steps': 10533, 'loss/train': 1.9462462663650513} +11/06/2021 22:42:35 - INFO - __main__ - Step 10535: {'lr': 0.0004959092433962742, 'samples': 2022720, 'steps': 10534, 'loss/train': 1.9173693656921387} +11/06/2021 22:42:35 - INFO - __main__ - Step 10536: {'lr': 0.0004959082872678169, 'samples': 2022912, 'steps': 10535, 'loss/train': 0.9070050716400146} +11/06/2021 22:42:35 - INFO - __main__ - Step 10537: {'lr': 0.0004959073310285572, 'samples': 2023104, 'steps': 10536, 'loss/train': 1.65950345993042} +11/06/2021 22:42:37 - INFO - __main__ - Step 10538: {'lr': 0.0004959063746784955, 'samples': 2023296, 'steps': 10537, 'loss/train': 1.9055320024490356} +11/06/2021 22:42:37 - INFO - __main__ - Step 10539: {'lr': 0.0004959054182176321, 'samples': 2023488, 'steps': 10538, 'loss/train': 1.639905333518982} +11/06/2021 22:42:38 - INFO - __main__ - Step 10540: {'lr': 0.0004959044616459676, 'samples': 2023680, 'steps': 10539, 'loss/train': 1.4272217750549316} +11/06/2021 22:42:38 - INFO - __main__ - Step 10541: {'lr': 0.0004959035049635023, 'samples': 2023872, 'steps': 10540, 'loss/train': 0.9154389500617981} +11/06/2021 22:42:38 - INFO - __main__ - Step 10542: {'lr': 0.0004959025481702366, 'samples': 2024064, 'steps': 10541, 'loss/train': 1.519034504890442} +11/06/2021 22:42:39 - INFO - __main__ - Step 10543: {'lr': 0.0004959015912661712, 'samples': 2024256, 'steps': 10542, 'loss/train': 1.571833848953247} +11/06/2021 22:42:40 - INFO - __main__ - Step 10544: {'lr': 0.0004959006342513062, 'samples': 2024448, 'steps': 10543, 'loss/train': 0.902131974697113} +11/06/2021 22:42:40 - INFO - __main__ - Step 10545: {'lr': 0.0004958996771256422, 'samples': 2024640, 'steps': 10544, 'loss/train': 1.765254259109497} +11/06/2021 22:42:40 - INFO - __main__ - Step 10546: {'lr': 0.0004958987198891796, 'samples': 2024832, 'steps': 10545, 'loss/train': 1.8613026142120361} +11/06/2021 22:42:41 - INFO - __main__ - Step 10547: {'lr': 0.0004958977625419187, 'samples': 2025024, 'steps': 10546, 'loss/train': 1.9227455854415894} +11/06/2021 22:42:41 - INFO - __main__ - Step 10548: {'lr': 0.0004958968050838603, 'samples': 2025216, 'steps': 10547, 'loss/train': 1.920836091041565} +11/06/2021 22:42:42 - INFO - __main__ - Step 10549: {'lr': 0.0004958958475150044, 'samples': 2025408, 'steps': 10548, 'loss/train': 1.9864680767059326} +11/06/2021 22:42:43 - INFO - __main__ - Step 10550: {'lr': 0.0004958948898353516, 'samples': 2025600, 'steps': 10549, 'loss/train': 1.8649414777755737} +11/06/2021 22:42:43 - INFO - __main__ - Step 10551: {'lr': 0.0004958939320449026, 'samples': 2025792, 'steps': 10550, 'loss/train': 2.0411078929901123} +11/06/2021 22:42:43 - INFO - __main__ - Step 10552: {'lr': 0.0004958929741436574, 'samples': 2025984, 'steps': 10551, 'loss/train': 1.3231031894683838} +11/06/2021 22:42:44 - INFO - __main__ - Step 10553: {'lr': 0.0004958920161316167, 'samples': 2026176, 'steps': 10552, 'loss/train': 1.855413556098938} +11/06/2021 22:42:45 - INFO - __main__ - Step 10554: {'lr': 0.0004958910580087808, 'samples': 2026368, 'steps': 10553, 'loss/train': 2.308320999145508} +11/06/2021 22:42:45 - INFO - __main__ - Step 10555: {'lr': 0.0004958900997751502, 'samples': 2026560, 'steps': 10554, 'loss/train': 1.9437730312347412} +11/06/2021 22:42:45 - INFO - __main__ - Step 10556: {'lr': 0.0004958891414307253, 'samples': 2026752, 'steps': 10555, 'loss/train': 2.246142864227295} +11/06/2021 22:42:46 - INFO - __main__ - Step 10557: {'lr': 0.0004958881829755066, 'samples': 2026944, 'steps': 10556, 'loss/train': 2.26411771774292} +11/06/2021 22:42:46 - INFO - __main__ - Step 10558: {'lr': 0.0004958872244094944, 'samples': 2027136, 'steps': 10557, 'loss/train': 1.6010162830352783} +11/06/2021 22:42:46 - INFO - __main__ - Step 10559: {'lr': 0.0004958862657326893, 'samples': 2027328, 'steps': 10558, 'loss/train': 1.5600662231445312} +11/06/2021 22:42:48 - INFO - __main__ - Step 10560: {'lr': 0.0004958853069450916, 'samples': 2027520, 'steps': 10559, 'loss/train': 1.8983862400054932} +11/06/2021 22:42:48 - INFO - __main__ - Step 10561: {'lr': 0.0004958843480467017, 'samples': 2027712, 'steps': 10560, 'loss/train': 0.7014676332473755} +11/06/2021 22:42:48 - INFO - __main__ - Step 10562: {'lr': 0.0004958833890375202, 'samples': 2027904, 'steps': 10561, 'loss/train': 1.9279460906982422} +11/06/2021 22:42:49 - INFO - __main__ - Step 10563: {'lr': 0.0004958824299175474, 'samples': 2028096, 'steps': 10562, 'loss/train': 1.799846887588501} +11/06/2021 22:42:49 - INFO - __main__ - Step 10564: {'lr': 0.0004958814706867838, 'samples': 2028288, 'steps': 10563, 'loss/train': 1.8568742275238037} +11/06/2021 22:42:50 - INFO - __main__ - Step 10565: {'lr': 0.0004958805113452298, 'samples': 2028480, 'steps': 10564, 'loss/train': 1.6105812788009644} +11/06/2021 22:42:50 - INFO - __main__ - Step 10566: {'lr': 0.0004958795518928858, 'samples': 2028672, 'steps': 10565, 'loss/train': 1.1961236000061035} +11/06/2021 22:42:51 - INFO - __main__ - Step 10567: {'lr': 0.0004958785923297522, 'samples': 2028864, 'steps': 10566, 'loss/train': 1.8169901371002197} +11/06/2021 22:42:51 - INFO - __main__ - Step 10568: {'lr': 0.0004958776326558298, 'samples': 2029056, 'steps': 10567, 'loss/train': 1.83092200756073} +11/06/2021 22:42:51 - INFO - __main__ - Step 10569: {'lr': 0.0004958766728711184, 'samples': 2029248, 'steps': 10568, 'loss/train': 1.380372166633606} +11/06/2021 22:42:52 - INFO - __main__ - Step 10570: {'lr': 0.000495875712975619, 'samples': 2029440, 'steps': 10569, 'loss/train': 1.897265076637268} +11/06/2021 22:42:53 - INFO - __main__ - Step 10571: {'lr': 0.0004958747529693316, 'samples': 2029632, 'steps': 10570, 'loss/train': 1.3889024257659912} +11/06/2021 22:42:53 - INFO - __main__ - Step 10572: {'lr': 0.000495873792852257, 'samples': 2029824, 'steps': 10571, 'loss/train': 1.0971200466156006} +11/06/2021 22:42:53 - INFO - __main__ - Step 10573: {'lr': 0.0004958728326243954, 'samples': 2030016, 'steps': 10572, 'loss/train': 1.5941991806030273} +11/06/2021 22:42:54 - INFO - __main__ - Step 10574: {'lr': 0.0004958718722857473, 'samples': 2030208, 'steps': 10573, 'loss/train': 1.6007957458496094} +11/06/2021 22:42:55 - INFO - __main__ - Step 10575: {'lr': 0.0004958709118363131, 'samples': 2030400, 'steps': 10574, 'loss/train': 1.9947025775909424} +11/06/2021 22:42:55 - INFO - __main__ - Step 10576: {'lr': 0.0004958699512760933, 'samples': 2030592, 'steps': 10575, 'loss/train': 1.9763280153274536} +11/06/2021 22:42:55 - INFO - __main__ - Step 10577: {'lr': 0.0004958689906050882, 'samples': 2030784, 'steps': 10576, 'loss/train': 1.577843189239502} +11/06/2021 22:42:56 - INFO - __main__ - Step 10578: {'lr': 0.0004958680298232983, 'samples': 2030976, 'steps': 10577, 'loss/train': 1.4245156049728394} +11/06/2021 22:42:56 - INFO - __main__ - Step 10579: {'lr': 0.0004958670689307242, 'samples': 2031168, 'steps': 10578, 'loss/train': 2.1011838912963867} +11/06/2021 22:42:57 - INFO - __main__ - Step 10580: {'lr': 0.0004958661079273662, 'samples': 2031360, 'steps': 10579, 'loss/train': 1.68887197971344} +11/06/2021 22:42:58 - INFO - __main__ - Step 10581: {'lr': 0.0004958651468132246, 'samples': 2031552, 'steps': 10580, 'loss/train': 1.6149951219558716} +11/06/2021 22:42:58 - INFO - __main__ - Step 10582: {'lr': 0.0004958641855883001, 'samples': 2031744, 'steps': 10581, 'loss/train': 1.577684760093689} +11/06/2021 22:42:58 - INFO - __main__ - Step 10583: {'lr': 0.0004958632242525929, 'samples': 2031936, 'steps': 10582, 'loss/train': 1.9628639221191406} +11/06/2021 22:42:59 - INFO - __main__ - Step 10584: {'lr': 0.0004958622628061035, 'samples': 2032128, 'steps': 10583, 'loss/train': 1.6041213274002075} +11/06/2021 22:42:59 - INFO - __main__ - Step 10585: {'lr': 0.0004958613012488324, 'samples': 2032320, 'steps': 10584, 'loss/train': 0.9554458856582642} +11/06/2021 22:43:00 - INFO - __main__ - Step 10586: {'lr': 0.00049586033958078, 'samples': 2032512, 'steps': 10585, 'loss/train': 2.0318799018859863} +11/06/2021 22:43:00 - INFO - __main__ - Step 10587: {'lr': 0.0004958593778019468, 'samples': 2032704, 'steps': 10586, 'loss/train': 1.9779229164123535} +11/06/2021 22:43:01 - INFO - __main__ - Step 10588: {'lr': 0.0004958584159123331, 'samples': 2032896, 'steps': 10587, 'loss/train': 2.021127939224243} +11/06/2021 22:43:01 - INFO - __main__ - Step 10589: {'lr': 0.0004958574539119392, 'samples': 2033088, 'steps': 10588, 'loss/train': 1.864471435546875} +11/06/2021 22:43:01 - INFO - __main__ - Step 10590: {'lr': 0.0004958564918007659, 'samples': 2033280, 'steps': 10589, 'loss/train': 0.6293484568595886} +11/06/2021 22:43:03 - INFO - __main__ - Step 10591: {'lr': 0.0004958555295788135, 'samples': 2033472, 'steps': 10590, 'loss/train': 1.892540454864502} +11/06/2021 22:43:03 - INFO - __main__ - Step 10592: {'lr': 0.0004958545672460824, 'samples': 2033664, 'steps': 10591, 'loss/train': 2.0386414527893066} +11/06/2021 22:43:03 - INFO - __main__ - Step 10593: {'lr': 0.0004958536048025729, 'samples': 2033856, 'steps': 10592, 'loss/train': 2.018533706665039} +11/06/2021 22:43:04 - INFO - __main__ - Step 10594: {'lr': 0.0004958526422482857, 'samples': 2034048, 'steps': 10593, 'loss/train': 1.8704800605773926} +11/06/2021 22:43:04 - INFO - __main__ - Step 10595: {'lr': 0.000495851679583221, 'samples': 2034240, 'steps': 10594, 'loss/train': 1.2096422910690308} +11/06/2021 22:43:05 - INFO - __main__ - Step 10596: {'lr': 0.0004958507168073793, 'samples': 2034432, 'steps': 10595, 'loss/train': 1.69189453125} +11/06/2021 22:43:05 - INFO - __main__ - Step 10597: {'lr': 0.0004958497539207611, 'samples': 2034624, 'steps': 10596, 'loss/train': 1.6835681200027466} +11/06/2021 22:43:06 - INFO - __main__ - Step 10598: {'lr': 0.0004958487909233669, 'samples': 2034816, 'steps': 10597, 'loss/train': 1.550663948059082} +11/06/2021 22:43:06 - INFO - __main__ - Step 10599: {'lr': 0.0004958478278151969, 'samples': 2035008, 'steps': 10598, 'loss/train': 1.3910499811172485} +11/06/2021 22:43:06 - INFO - __main__ - Step 10600: {'lr': 0.0004958468645962517, 'samples': 2035200, 'steps': 10599, 'loss/train': 0.5436376333236694} +11/06/2021 22:43:08 - INFO - __main__ - Step 10601: {'lr': 0.0004958459012665317, 'samples': 2035392, 'steps': 10600, 'loss/train': 1.8061374425888062} +11/06/2021 22:43:08 - INFO - __main__ - Step 10602: {'lr': 0.0004958449378260374, 'samples': 2035584, 'steps': 10601, 'loss/train': 1.4709066152572632} +11/06/2021 22:43:08 - INFO - __main__ - Step 10603: {'lr': 0.000495843974274769, 'samples': 2035776, 'steps': 10602, 'loss/train': 1.4589587450027466} +11/06/2021 22:43:09 - INFO - __main__ - Step 10604: {'lr': 0.0004958430106127272, 'samples': 2035968, 'steps': 10603, 'loss/train': 2.1720454692840576} +11/06/2021 22:43:09 - INFO - __main__ - Step 10605: {'lr': 0.0004958420468399123, 'samples': 2036160, 'steps': 10604, 'loss/train': 1.612654209136963} +11/06/2021 22:43:10 - INFO - __main__ - Step 10606: {'lr': 0.0004958410829563248, 'samples': 2036352, 'steps': 10605, 'loss/train': 1.6653211116790771} +11/06/2021 22:43:10 - INFO - __main__ - Step 10607: {'lr': 0.0004958401189619652, 'samples': 2036544, 'steps': 10606, 'loss/train': 1.9401401281356812} +11/06/2021 22:43:11 - INFO - __main__ - Step 10608: {'lr': 0.0004958391548568336, 'samples': 2036736, 'steps': 10607, 'loss/train': 2.150745391845703} +11/06/2021 22:43:11 - INFO - __main__ - Step 10609: {'lr': 0.0004958381906409308, 'samples': 2036928, 'steps': 10608, 'loss/train': 1.7484651803970337} +11/06/2021 22:43:11 - INFO - __main__ - Step 10610: {'lr': 0.0004958372263142571, 'samples': 2037120, 'steps': 10609, 'loss/train': 1.8919156789779663} +11/06/2021 22:43:12 - INFO - __main__ - Step 10611: {'lr': 0.0004958362618768129, 'samples': 2037312, 'steps': 10610, 'loss/train': 1.3154926300048828} +11/06/2021 22:43:14 - INFO - __main__ - Step 10612: {'lr': 0.0004958352973285987, 'samples': 2037504, 'steps': 10611, 'loss/train': 1.8000268936157227} +11/06/2021 22:43:14 - INFO - __main__ - Step 10613: {'lr': 0.000495834332669615, 'samples': 2037696, 'steps': 10612, 'loss/train': 0.241807758808136} +11/06/2021 22:43:15 - INFO - __main__ - Step 10614: {'lr': 0.0004958333678998622, 'samples': 2037888, 'steps': 10613, 'loss/train': 1.521072268486023} +11/06/2021 22:43:15 - INFO - __main__ - Step 10615: {'lr': 0.0004958324030193404, 'samples': 2038080, 'steps': 10614, 'loss/train': 1.6696323156356812} +11/06/2021 22:43:15 - INFO - __main__ - Step 10616: {'lr': 0.0004958314380280504, 'samples': 2038272, 'steps': 10615, 'loss/train': 1.4865412712097168} +11/06/2021 22:43:16 - INFO - __main__ - Step 10617: {'lr': 0.0004958304729259927, 'samples': 2038464, 'steps': 10616, 'loss/train': 1.9140490293502808} +11/06/2021 22:43:16 - INFO - __main__ - Step 10618: {'lr': 0.0004958295077131674, 'samples': 2038656, 'steps': 10617, 'loss/train': 1.3753329515457153} +11/06/2021 22:43:17 - INFO - __main__ - Step 10619: {'lr': 0.0004958285423895752, 'samples': 2038848, 'steps': 10618, 'loss/train': 1.8530157804489136} +11/06/2021 22:43:18 - INFO - __main__ - Step 10620: {'lr': 0.0004958275769552165, 'samples': 2039040, 'steps': 10619, 'loss/train': 1.2794376611709595} +11/06/2021 22:43:18 - INFO - __main__ - Step 10621: {'lr': 0.0004958266114100917, 'samples': 2039232, 'steps': 10620, 'loss/train': 1.9506590366363525} +11/06/2021 22:43:18 - INFO - __main__ - Step 10622: {'lr': 0.0004958256457542011, 'samples': 2039424, 'steps': 10621, 'loss/train': 1.7138190269470215} +11/06/2021 22:43:19 - INFO - __main__ - Step 10623: {'lr': 0.0004958246799875453, 'samples': 2039616, 'steps': 10622, 'loss/train': 1.564102292060852} +11/06/2021 22:43:19 - INFO - __main__ - Step 10624: {'lr': 0.0004958237141101247, 'samples': 2039808, 'steps': 10623, 'loss/train': 0.428017258644104} +11/06/2021 22:43:19 - INFO - __main__ - Step 10625: {'lr': 0.0004958227481219399, 'samples': 2040000, 'steps': 10624, 'loss/train': 1.5035067796707153} +11/06/2021 22:43:21 - INFO - __main__ - Step 10626: {'lr': 0.0004958217820229909, 'samples': 2040192, 'steps': 10625, 'loss/train': 1.7794239521026611} +11/06/2021 22:43:21 - INFO - __main__ - Step 10627: {'lr': 0.0004958208158132785, 'samples': 2040384, 'steps': 10626, 'loss/train': 1.4251916408538818} +11/06/2021 22:43:21 - INFO - __main__ - Step 10628: {'lr': 0.000495819849492803, 'samples': 2040576, 'steps': 10627, 'loss/train': 1.7260355949401855} +11/06/2021 22:43:22 - INFO - __main__ - Step 10629: {'lr': 0.0004958188830615649, 'samples': 2040768, 'steps': 10628, 'loss/train': 2.004051446914673} +11/06/2021 22:43:22 - INFO - __main__ - Step 10630: {'lr': 0.0004958179165195646, 'samples': 2040960, 'steps': 10629, 'loss/train': 1.7460932731628418} +11/06/2021 22:43:23 - INFO - __main__ - Step 10631: {'lr': 0.0004958169498668026, 'samples': 2041152, 'steps': 10630, 'loss/train': 1.8938854932785034} +11/06/2021 22:43:23 - INFO - __main__ - Step 10632: {'lr': 0.0004958159831032793, 'samples': 2041344, 'steps': 10631, 'loss/train': 1.446541428565979} +11/06/2021 22:43:24 - INFO - __main__ - Step 10633: {'lr': 0.000495815016228995, 'samples': 2041536, 'steps': 10632, 'loss/train': 1.7085440158843994} +11/06/2021 22:43:24 - INFO - __main__ - Step 10634: {'lr': 0.0004958140492439502, 'samples': 2041728, 'steps': 10633, 'loss/train': 1.8917224407196045} +11/06/2021 22:43:24 - INFO - __main__ - Step 10635: {'lr': 0.0004958130821481455, 'samples': 2041920, 'steps': 10634, 'loss/train': 1.9071261882781982} +11/06/2021 22:43:25 - INFO - __main__ - Step 10636: {'lr': 0.0004958121149415812, 'samples': 2042112, 'steps': 10635, 'loss/train': 1.352231502532959} +11/06/2021 22:43:26 - INFO - __main__ - Step 10637: {'lr': 0.0004958111476242577, 'samples': 2042304, 'steps': 10636, 'loss/train': 1.8399983644485474} +11/06/2021 22:43:26 - INFO - __main__ - Step 10638: {'lr': 0.0004958101801961755, 'samples': 2042496, 'steps': 10637, 'loss/train': 2.4199862480163574} +11/06/2021 22:43:26 - INFO - __main__ - Step 10639: {'lr': 0.0004958092126573352, 'samples': 2042688, 'steps': 10638, 'loss/train': 1.832000970840454} +11/06/2021 22:43:27 - INFO - __main__ - Step 10640: {'lr': 0.0004958082450077369, 'samples': 2042880, 'steps': 10639, 'loss/train': 2.0270063877105713} +11/06/2021 22:43:28 - INFO - __main__ - Step 10641: {'lr': 0.0004958072772473812, 'samples': 2043072, 'steps': 10640, 'loss/train': 1.655840277671814} +11/06/2021 22:43:28 - INFO - __main__ - Step 10642: {'lr': 0.0004958063093762684, 'samples': 2043264, 'steps': 10641, 'loss/train': 2.09566330909729} +11/06/2021 22:43:29 - INFO - __main__ - Step 10643: {'lr': 0.0004958053413943993, 'samples': 2043456, 'steps': 10642, 'loss/train': 1.8067339658737183} +11/06/2021 22:43:29 - INFO - __main__ - Step 10644: {'lr': 0.0004958043733017741, 'samples': 2043648, 'steps': 10643, 'loss/train': 1.5341635942459106} +11/06/2021 22:43:29 - INFO - __main__ - Step 10645: {'lr': 0.0004958034050983932, 'samples': 2043840, 'steps': 10644, 'loss/train': 1.7686036825180054} +11/06/2021 22:43:30 - INFO - __main__ - Step 10646: {'lr': 0.0004958024367842569, 'samples': 2044032, 'steps': 10645, 'loss/train': 1.8402926921844482} +11/06/2021 22:43:31 - INFO - __main__ - Step 10647: {'lr': 0.000495801468359366, 'samples': 2044224, 'steps': 10646, 'loss/train': 1.6536637544631958} +11/06/2021 22:43:31 - INFO - __main__ - Step 10648: {'lr': 0.0004958004998237207, 'samples': 2044416, 'steps': 10647, 'loss/train': 2.0047109127044678} +11/06/2021 22:43:31 - INFO - __main__ - Step 10649: {'lr': 0.0004957995311773215, 'samples': 2044608, 'steps': 10648, 'loss/train': 1.8218034505844116} +11/06/2021 22:43:32 - INFO - __main__ - Step 10650: {'lr': 0.0004957985624201688, 'samples': 2044800, 'steps': 10649, 'loss/train': 1.3269506692886353} +11/06/2021 22:43:32 - INFO - __main__ - Step 10651: {'lr': 0.0004957975935522632, 'samples': 2044992, 'steps': 10650, 'loss/train': 1.8232018947601318} +11/06/2021 22:43:33 - INFO - __main__ - Step 10652: {'lr': 0.0004957966245736048, 'samples': 2045184, 'steps': 10651, 'loss/train': 1.26266348361969} +11/06/2021 22:43:34 - INFO - __main__ - Step 10653: {'lr': 0.0004957956554841943, 'samples': 2045376, 'steps': 10652, 'loss/train': 1.7997419834136963} +11/06/2021 22:43:34 - INFO - __main__ - Step 10654: {'lr': 0.0004957946862840321, 'samples': 2045568, 'steps': 10653, 'loss/train': 1.7390581369400024} +11/06/2021 22:43:34 - INFO - __main__ - Step 10655: {'lr': 0.0004957937169731186, 'samples': 2045760, 'steps': 10654, 'loss/train': 1.672598958015442} +11/06/2021 22:43:35 - INFO - __main__ - Step 10656: {'lr': 0.0004957927475514542, 'samples': 2045952, 'steps': 10655, 'loss/train': 1.358737826347351} +11/06/2021 22:43:36 - INFO - __main__ - Step 10657: {'lr': 0.0004957917780190395, 'samples': 2046144, 'steps': 10656, 'loss/train': 1.9060399532318115} +11/06/2021 22:43:36 - INFO - __main__ - Step 10658: {'lr': 0.0004957908083758747, 'samples': 2046336, 'steps': 10657, 'loss/train': 1.6999403238296509} +11/06/2021 22:43:36 - INFO - __main__ - Step 10659: {'lr': 0.0004957898386219603, 'samples': 2046528, 'steps': 10658, 'loss/train': 1.6076505184173584} +11/06/2021 22:43:37 - INFO - __main__ - Step 10660: {'lr': 0.000495788868757297, 'samples': 2046720, 'steps': 10659, 'loss/train': 1.7159380912780762} +11/06/2021 22:43:37 - INFO - __main__ - Step 10661: {'lr': 0.0004957878987818849, 'samples': 2046912, 'steps': 10660, 'loss/train': 1.4848712682724} +11/06/2021 22:43:39 - INFO - __main__ - Step 10662: {'lr': 0.0004957869286957246, 'samples': 2047104, 'steps': 10661, 'loss/train': 1.9166350364685059} +11/06/2021 22:43:39 - INFO - __main__ - Step 10663: {'lr': 0.0004957859584988164, 'samples': 2047296, 'steps': 10662, 'loss/train': 1.3673206567764282} +11/06/2021 22:43:39 - INFO - __main__ - Step 10664: {'lr': 0.0004957849881911609, 'samples': 2047488, 'steps': 10663, 'loss/train': 1.7530118227005005} +11/06/2021 22:43:40 - INFO - __main__ - Step 10665: {'lr': 0.0004957840177727585, 'samples': 2047680, 'steps': 10664, 'loss/train': 1.5396183729171753} +11/06/2021 22:43:40 - INFO - __main__ - Step 10666: {'lr': 0.0004957830472436097, 'samples': 2047872, 'steps': 10665, 'loss/train': 2.27144718170166} +11/06/2021 22:43:40 - INFO - __main__ - Step 10667: {'lr': 0.0004957820766037147, 'samples': 2048064, 'steps': 10666, 'loss/train': 2.53610897064209} +11/06/2021 22:43:41 - INFO - __main__ - Step 10668: {'lr': 0.0004957811058530742, 'samples': 2048256, 'steps': 10667, 'loss/train': 2.2089219093322754} +11/06/2021 22:43:42 - INFO - __main__ - Step 10669: {'lr': 0.0004957801349916884, 'samples': 2048448, 'steps': 10668, 'loss/train': 2.4702768325805664} +11/06/2021 22:43:42 - INFO - __main__ - Step 10670: {'lr': 0.000495779164019558, 'samples': 2048640, 'steps': 10669, 'loss/train': 0.2976198196411133} +11/06/2021 22:43:42 - INFO - __main__ - Step 10671: {'lr': 0.0004957781929366832, 'samples': 2048832, 'steps': 10670, 'loss/train': 2.503723382949829} +11/06/2021 22:43:43 - INFO - __main__ - Step 10672: {'lr': 0.0004957772217430646, 'samples': 2049024, 'steps': 10671, 'loss/train': 1.338193416595459} +11/06/2021 22:43:44 - INFO - __main__ - Step 10673: {'lr': 0.0004957762504387025, 'samples': 2049216, 'steps': 10672, 'loss/train': 1.5494346618652344} +11/06/2021 22:43:45 - INFO - __main__ - Step 10674: {'lr': 0.0004957752790235976, 'samples': 2049408, 'steps': 10673, 'loss/train': 2.082453489303589} +11/06/2021 22:43:45 - INFO - __main__ - Step 10675: {'lr': 0.00049577430749775, 'samples': 2049600, 'steps': 10674, 'loss/train': 1.9406588077545166} +11/06/2021 22:43:45 - INFO - __main__ - Step 10676: {'lr': 0.0004957733358611602, 'samples': 2049792, 'steps': 10675, 'loss/train': 1.727967381477356} +11/06/2021 22:43:46 - INFO - __main__ - Step 10677: {'lr': 0.0004957723641138289, 'samples': 2049984, 'steps': 10676, 'loss/train': 1.9043892621994019} +11/06/2021 22:43:47 - INFO - __main__ - Step 10678: {'lr': 0.0004957713922557563, 'samples': 2050176, 'steps': 10677, 'loss/train': 1.6342339515686035} +11/06/2021 22:43:47 - INFO - __main__ - Step 10679: {'lr': 0.0004957704202869429, 'samples': 2050368, 'steps': 10678, 'loss/train': 2.188232898712158} +11/06/2021 22:43:47 - INFO - __main__ - Step 10680: {'lr': 0.0004957694482073891, 'samples': 2050560, 'steps': 10679, 'loss/train': 2.068922758102417} +11/06/2021 22:43:48 - INFO - __main__ - Step 10681: {'lr': 0.0004957684760170955, 'samples': 2050752, 'steps': 10680, 'loss/train': 1.8861031532287598} +11/06/2021 22:43:48 - INFO - __main__ - Step 10682: {'lr': 0.0004957675037160624, 'samples': 2050944, 'steps': 10681, 'loss/train': 1.979127049446106} +11/06/2021 22:43:49 - INFO - __main__ - Step 10683: {'lr': 0.0004957665313042902, 'samples': 2051136, 'steps': 10682, 'loss/train': 1.728943109512329} +11/06/2021 22:43:49 - INFO - __main__ - Step 10684: {'lr': 0.0004957655587817793, 'samples': 2051328, 'steps': 10683, 'loss/train': 1.295758605003357} +11/06/2021 22:43:50 - INFO - __main__ - Step 10685: {'lr': 0.0004957645861485304, 'samples': 2051520, 'steps': 10684, 'loss/train': 1.4567430019378662} +11/06/2021 22:43:50 - INFO - __main__ - Step 10686: {'lr': 0.0004957636134045437, 'samples': 2051712, 'steps': 10685, 'loss/train': 1.5401474237442017} +11/06/2021 22:43:50 - INFO - __main__ - Step 10687: {'lr': 0.0004957626405498196, 'samples': 2051904, 'steps': 10686, 'loss/train': 2.0036814212799072} +11/06/2021 22:43:51 - INFO - __main__ - Step 10688: {'lr': 0.0004957616675843588, 'samples': 2052096, 'steps': 10687, 'loss/train': 1.8221772909164429} +11/06/2021 22:43:52 - INFO - __main__ - Step 10689: {'lr': 0.0004957606945081615, 'samples': 2052288, 'steps': 10688, 'loss/train': 1.658942461013794} +11/06/2021 22:43:52 - INFO - __main__ - Step 10690: {'lr': 0.0004957597213212284, 'samples': 2052480, 'steps': 10689, 'loss/train': 1.7910033464431763} +11/06/2021 22:43:52 - INFO - __main__ - Step 10691: {'lr': 0.0004957587480235595, 'samples': 2052672, 'steps': 10690, 'loss/train': 1.7230714559555054} +11/06/2021 22:43:53 - INFO - __main__ - Step 10692: {'lr': 0.0004957577746151556, 'samples': 2052864, 'steps': 10691, 'loss/train': 1.9783008098602295} +11/06/2021 22:43:54 - INFO - __main__ - Step 10693: {'lr': 0.0004957568010960171, 'samples': 2053056, 'steps': 10692, 'loss/train': 1.6153764724731445} +11/06/2021 22:43:54 - INFO - __main__ - Step 10694: {'lr': 0.0004957558274661444, 'samples': 2053248, 'steps': 10693, 'loss/train': 1.5456531047821045} +11/06/2021 22:43:55 - INFO - __main__ - Step 10695: {'lr': 0.0004957548537255378, 'samples': 2053440, 'steps': 10694, 'loss/train': 2.194444417953491} +11/06/2021 22:43:55 - INFO - __main__ - Step 10696: {'lr': 0.000495753879874198, 'samples': 2053632, 'steps': 10695, 'loss/train': 1.8297362327575684} +11/06/2021 22:43:55 - INFO - __main__ - Step 10697: {'lr': 0.0004957529059121251, 'samples': 2053824, 'steps': 10696, 'loss/train': 2.081062078475952} +11/06/2021 22:43:56 - INFO - __main__ - Step 10698: {'lr': 0.0004957519318393199, 'samples': 2054016, 'steps': 10697, 'loss/train': 1.8401142358779907} +11/06/2021 22:43:57 - INFO - __main__ - Step 10699: {'lr': 0.0004957509576557826, 'samples': 2054208, 'steps': 10698, 'loss/train': 1.7377288341522217} +11/06/2021 22:43:57 - INFO - __main__ - Step 10700: {'lr': 0.0004957499833615137, 'samples': 2054400, 'steps': 10699, 'loss/train': 2.147418260574341} +11/06/2021 22:43:57 - INFO - __main__ - Step 10701: {'lr': 0.0004957490089565137, 'samples': 2054592, 'steps': 10700, 'loss/train': 1.7337613105773926} +11/06/2021 22:43:58 - INFO - __main__ - Step 10702: {'lr': 0.0004957480344407829, 'samples': 2054784, 'steps': 10701, 'loss/train': 1.7109180688858032} +11/06/2021 22:43:58 - INFO - __main__ - Step 10703: {'lr': 0.0004957470598143218, 'samples': 2054976, 'steps': 10702, 'loss/train': 1.4152930974960327} +11/06/2021 22:43:59 - INFO - __main__ - Step 10704: {'lr': 0.000495746085077131, 'samples': 2055168, 'steps': 10703, 'loss/train': 1.6608555316925049} +11/06/2021 22:44:00 - INFO - __main__ - Step 10705: {'lr': 0.0004957451102292108, 'samples': 2055360, 'steps': 10704, 'loss/train': 1.8776973485946655} +11/06/2021 22:44:00 - INFO - __main__ - Step 10706: {'lr': 0.0004957441352705616, 'samples': 2055552, 'steps': 10705, 'loss/train': 1.9885625839233398} +11/06/2021 22:44:00 - INFO - __main__ - Step 10707: {'lr': 0.0004957431602011839, 'samples': 2055744, 'steps': 10706, 'loss/train': 1.5255722999572754} +11/06/2021 22:44:01 - INFO - __main__ - Step 10708: {'lr': 0.0004957421850210781, 'samples': 2055936, 'steps': 10707, 'loss/train': 1.827954649925232} +11/06/2021 22:44:02 - INFO - __main__ - Step 10709: {'lr': 0.0004957412097302446, 'samples': 2056128, 'steps': 10708, 'loss/train': 2.0723941326141357} +11/06/2021 22:44:02 - INFO - __main__ - Step 10710: {'lr': 0.000495740234328684, 'samples': 2056320, 'steps': 10709, 'loss/train': 2.509693145751953} +11/06/2021 22:44:02 - INFO - __main__ - Step 10711: {'lr': 0.0004957392588163967, 'samples': 2056512, 'steps': 10710, 'loss/train': 1.9670145511627197} +11/06/2021 22:44:03 - INFO - __main__ - Step 10712: {'lr': 0.000495738283193383, 'samples': 2056704, 'steps': 10711, 'loss/train': 1.6758942604064941} +11/06/2021 22:44:03 - INFO - __main__ - Step 10713: {'lr': 0.0004957373074596434, 'samples': 2056896, 'steps': 10712, 'loss/train': 1.8210440874099731} +11/06/2021 22:44:04 - INFO - __main__ - Step 10714: {'lr': 0.0004957363316151784, 'samples': 2057088, 'steps': 10713, 'loss/train': 1.4150325059890747} +11/06/2021 22:44:04 - INFO - __main__ - Step 10715: {'lr': 0.0004957353556599884, 'samples': 2057280, 'steps': 10714, 'loss/train': 1.9680533409118652} +11/06/2021 22:44:05 - INFO - __main__ - Step 10716: {'lr': 0.0004957343795940738, 'samples': 2057472, 'steps': 10715, 'loss/train': 2.222113847732544} +11/06/2021 22:44:05 - INFO - __main__ - Step 10717: {'lr': 0.0004957334034174351, 'samples': 2057664, 'steps': 10716, 'loss/train': 1.4754172563552856} +11/06/2021 22:44:06 - INFO - __main__ - Step 10718: {'lr': 0.0004957324271300728, 'samples': 2057856, 'steps': 10717, 'loss/train': 1.6506346464157104} +11/06/2021 22:44:07 - INFO - __main__ - Step 10719: {'lr': 0.0004957314507319871, 'samples': 2058048, 'steps': 10718, 'loss/train': 1.6497141122817993} +11/06/2021 22:44:07 - INFO - __main__ - Step 10720: {'lr': 0.0004957304742231787, 'samples': 2058240, 'steps': 10719, 'loss/train': 1.7145750522613525} +11/06/2021 22:44:07 - INFO - __main__ - Step 10721: {'lr': 0.0004957294976036479, 'samples': 2058432, 'steps': 10720, 'loss/train': 1.7986055612564087} +11/06/2021 22:44:08 - INFO - __main__ - Step 10722: {'lr': 0.0004957285208733953, 'samples': 2058624, 'steps': 10721, 'loss/train': 1.592078447341919} +11/06/2021 22:44:08 - INFO - __main__ - Step 10723: {'lr': 0.0004957275440324211, 'samples': 2058816, 'steps': 10722, 'loss/train': 1.7179454565048218} +11/06/2021 22:44:09 - INFO - __main__ - Step 10724: {'lr': 0.0004957265670807258, 'samples': 2059008, 'steps': 10723, 'loss/train': 1.8023722171783447} +11/06/2021 22:44:09 - INFO - __main__ - Step 10725: {'lr': 0.0004957255900183101, 'samples': 2059200, 'steps': 10724, 'loss/train': 2.032273292541504} +11/06/2021 22:44:10 - INFO - __main__ - Step 10726: {'lr': 0.000495724612845174, 'samples': 2059392, 'steps': 10725, 'loss/train': 1.7515367269515991} +11/06/2021 22:44:10 - INFO - __main__ - Step 10727: {'lr': 0.0004957236355613184, 'samples': 2059584, 'steps': 10726, 'loss/train': 1.7511495351791382} +11/06/2021 22:44:10 - INFO - __main__ - Step 10728: {'lr': 0.0004957226581667434, 'samples': 2059776, 'steps': 10727, 'loss/train': 2.232154369354248} +11/06/2021 22:44:11 - INFO - __main__ - Step 10729: {'lr': 0.0004957216806614496, 'samples': 2059968, 'steps': 10728, 'loss/train': 2.1359822750091553} +11/06/2021 22:44:12 - INFO - __main__ - Step 10730: {'lr': 0.0004957207030454374, 'samples': 2060160, 'steps': 10729, 'loss/train': 2.018582582473755} +11/06/2021 22:44:12 - INFO - __main__ - Step 10731: {'lr': 0.0004957197253187073, 'samples': 2060352, 'steps': 10730, 'loss/train': 1.6088690757751465} +11/06/2021 22:44:12 - INFO - __main__ - Step 10732: {'lr': 0.0004957187474812595, 'samples': 2060544, 'steps': 10731, 'loss/train': 1.1297942399978638} +11/06/2021 22:44:13 - INFO - __main__ - Step 10733: {'lr': 0.0004957177695330948, 'samples': 2060736, 'steps': 10732, 'loss/train': 1.5375380516052246} +11/06/2021 22:44:13 - INFO - __main__ - Step 10734: {'lr': 0.0004957167914742134, 'samples': 2060928, 'steps': 10733, 'loss/train': 1.797157883644104} +11/06/2021 22:44:14 - INFO - __main__ - Step 10735: {'lr': 0.0004957158133046158, 'samples': 2061120, 'steps': 10734, 'loss/train': 2.323326587677002} +11/06/2021 22:44:15 - INFO - __main__ - Step 10736: {'lr': 0.0004957148350243025, 'samples': 2061312, 'steps': 10735, 'loss/train': 2.2027082443237305} +11/06/2021 22:44:15 - INFO - __main__ - Step 10737: {'lr': 0.0004957138566332738, 'samples': 2061504, 'steps': 10736, 'loss/train': 1.9741092920303345} +11/06/2021 22:44:15 - INFO - __main__ - Step 10738: {'lr': 0.0004957128781315303, 'samples': 2061696, 'steps': 10737, 'loss/train': 1.5470525026321411} +11/06/2021 22:44:16 - INFO - __main__ - Step 10739: {'lr': 0.0004957118995190723, 'samples': 2061888, 'steps': 10738, 'loss/train': 1.9221845865249634} +11/06/2021 22:44:17 - INFO - __main__ - Step 10740: {'lr': 0.0004957109207959004, 'samples': 2062080, 'steps': 10739, 'loss/train': 1.5594979524612427} +11/06/2021 22:44:17 - INFO - __main__ - Step 10741: {'lr': 0.0004957099419620149, 'samples': 2062272, 'steps': 10740, 'loss/train': 1.0245342254638672} +11/06/2021 22:44:17 - INFO - __main__ - Step 10742: {'lr': 0.0004957089630174163, 'samples': 2062464, 'steps': 10741, 'loss/train': 1.913503885269165} +11/06/2021 22:44:18 - INFO - __main__ - Step 10743: {'lr': 0.0004957079839621051, 'samples': 2062656, 'steps': 10742, 'loss/train': 2.051661968231201} +11/06/2021 22:44:18 - INFO - __main__ - Step 10744: {'lr': 0.0004957070047960816, 'samples': 2062848, 'steps': 10743, 'loss/train': 2.0730690956115723} +11/06/2021 22:44:19 - INFO - __main__ - Step 10745: {'lr': 0.0004957060255193462, 'samples': 2063040, 'steps': 10744, 'loss/train': 2.2329344749450684} +11/06/2021 22:44:19 - INFO - __main__ - Step 10746: {'lr': 0.0004957050461318997, 'samples': 2063232, 'steps': 10745, 'loss/train': 1.7052743434906006} +11/06/2021 22:44:20 - INFO - __main__ - Step 10747: {'lr': 0.0004957040666337422, 'samples': 2063424, 'steps': 10746, 'loss/train': 1.7934210300445557} +11/06/2021 22:44:20 - INFO - __main__ - Step 10748: {'lr': 0.0004957030870248742, 'samples': 2063616, 'steps': 10747, 'loss/train': 1.2029649019241333} +11/06/2021 22:44:21 - INFO - __main__ - Step 10749: {'lr': 0.0004957021073052962, 'samples': 2063808, 'steps': 10748, 'loss/train': 1.534114122390747} +11/06/2021 22:44:21 - INFO - __main__ - Step 10750: {'lr': 0.0004957011274750086, 'samples': 2064000, 'steps': 10749, 'loss/train': 0.9407898783683777} +11/06/2021 22:44:22 - INFO - __main__ - Step 10751: {'lr': 0.0004957001475340119, 'samples': 2064192, 'steps': 10750, 'loss/train': 1.5393911600112915} +11/06/2021 22:44:22 - INFO - __main__ - Step 10752: {'lr': 0.0004956991674823065, 'samples': 2064384, 'steps': 10751, 'loss/train': 1.8228400945663452} +11/06/2021 22:44:23 - INFO - __main__ - Step 10753: {'lr': 0.0004956981873198928, 'samples': 2064576, 'steps': 10752, 'loss/train': 1.507121205329895} +11/06/2021 22:44:23 - INFO - __main__ - Step 10754: {'lr': 0.0004956972070467712, 'samples': 2064768, 'steps': 10753, 'loss/train': 1.64657461643219} +11/06/2021 22:44:23 - INFO - __main__ - Step 10755: {'lr': 0.0004956962266629424, 'samples': 2064960, 'steps': 10754, 'loss/train': 1.6212588548660278} +11/06/2021 22:44:24 - INFO - __main__ - Step 10756: {'lr': 0.0004956952461684066, 'samples': 2065152, 'steps': 10755, 'loss/train': 2.1202139854431152} +11/06/2021 22:44:25 - INFO - __main__ - Step 10757: {'lr': 0.0004956942655631644, 'samples': 2065344, 'steps': 10756, 'loss/train': 1.5507880449295044} +11/06/2021 22:44:25 - INFO - __main__ - Step 10758: {'lr': 0.0004956932848472161, 'samples': 2065536, 'steps': 10757, 'loss/train': 1.8729193210601807} +11/06/2021 22:44:25 - INFO - __main__ - Step 10759: {'lr': 0.0004956923040205622, 'samples': 2065728, 'steps': 10758, 'loss/train': 1.7279722690582275} +11/06/2021 22:44:26 - INFO - __main__ - Step 10760: {'lr': 0.0004956913230832031, 'samples': 2065920, 'steps': 10759, 'loss/train': 2.134770154953003} +11/06/2021 22:44:27 - INFO - __main__ - Step 10761: {'lr': 0.0004956903420351393, 'samples': 2066112, 'steps': 10760, 'loss/train': 1.6158196926116943} +11/06/2021 22:44:28 - INFO - __main__ - Step 10762: {'lr': 0.0004956893608763713, 'samples': 2066304, 'steps': 10761, 'loss/train': 1.8567177057266235} +11/06/2021 22:44:28 - INFO - __main__ - Step 10763: {'lr': 0.0004956883796068993, 'samples': 2066496, 'steps': 10762, 'loss/train': 1.9238213300704956} +11/06/2021 22:44:28 - INFO - __main__ - Step 10764: {'lr': 0.000495687398226724, 'samples': 2066688, 'steps': 10763, 'loss/train': 1.661841869354248} +11/06/2021 22:44:29 - INFO - __main__ - Step 10765: {'lr': 0.0004956864167358458, 'samples': 2066880, 'steps': 10764, 'loss/train': 1.6980998516082764} +11/06/2021 22:44:29 - INFO - __main__ - Step 10766: {'lr': 0.000495685435134265, 'samples': 2067072, 'steps': 10765, 'loss/train': 1.7710494995117188} +11/06/2021 22:44:30 - INFO - __main__ - Step 10767: {'lr': 0.0004956844534219822, 'samples': 2067264, 'steps': 10766, 'loss/train': 1.8926702737808228} +11/06/2021 22:44:31 - INFO - __main__ - Step 10768: {'lr': 0.0004956834715989977, 'samples': 2067456, 'steps': 10767, 'loss/train': 1.8057781457901} +11/06/2021 22:44:31 - INFO - __main__ - Step 10769: {'lr': 0.0004956824896653122, 'samples': 2067648, 'steps': 10768, 'loss/train': 1.9344799518585205} +11/06/2021 22:44:31 - INFO - __main__ - Step 10770: {'lr': 0.0004956815076209257, 'samples': 2067840, 'steps': 10769, 'loss/train': 1.7666970491409302} +11/06/2021 22:44:32 - INFO - __main__ - Step 10771: {'lr': 0.0004956805254658391, 'samples': 2068032, 'steps': 10770, 'loss/train': 1.9876887798309326} +11/06/2021 22:44:32 - INFO - __main__ - Step 10772: {'lr': 0.0004956795432000526, 'samples': 2068224, 'steps': 10771, 'loss/train': 1.9097800254821777} +11/06/2021 22:44:33 - INFO - __main__ - Step 10773: {'lr': 0.0004956785608235667, 'samples': 2068416, 'steps': 10772, 'loss/train': 1.9691766500473022} +11/06/2021 22:44:33 - INFO - __main__ - Step 10774: {'lr': 0.0004956775783363817, 'samples': 2068608, 'steps': 10773, 'loss/train': 1.7181099653244019} +11/06/2021 22:44:34 - INFO - __main__ - Step 10775: {'lr': 0.0004956765957384984, 'samples': 2068800, 'steps': 10774, 'loss/train': 1.4132951498031616} +11/06/2021 22:44:34 - INFO - __main__ - Step 10776: {'lr': 0.0004956756130299169, 'samples': 2068992, 'steps': 10775, 'loss/train': 1.20347261428833} +11/06/2021 22:44:34 - INFO - __main__ - Step 10777: {'lr': 0.0004956746302106378, 'samples': 2069184, 'steps': 10776, 'loss/train': 1.4337294101715088} +11/06/2021 22:44:35 - INFO - __main__ - Step 10778: {'lr': 0.0004956736472806614, 'samples': 2069376, 'steps': 10777, 'loss/train': 1.8119988441467285} +11/06/2021 22:44:36 - INFO - __main__ - Step 10779: {'lr': 0.0004956726642399883, 'samples': 2069568, 'steps': 10778, 'loss/train': 1.28266179561615} +11/06/2021 22:44:36 - INFO - __main__ - Step 10780: {'lr': 0.0004956716810886189, 'samples': 2069760, 'steps': 10779, 'loss/train': 1.9151232242584229} +11/06/2021 22:44:36 - INFO - __main__ - Step 10781: {'lr': 0.0004956706978265536, 'samples': 2069952, 'steps': 10780, 'loss/train': 1.7361626625061035} +11/06/2021 22:44:37 - INFO - __main__ - Step 10782: {'lr': 0.0004956697144537929, 'samples': 2070144, 'steps': 10781, 'loss/train': 1.9696669578552246} +11/06/2021 22:44:38 - INFO - __main__ - Step 10783: {'lr': 0.0004956687309703372, 'samples': 2070336, 'steps': 10782, 'loss/train': 2.0651187896728516} +11/06/2021 22:44:38 - INFO - __main__ - Step 10784: {'lr': 0.0004956677473761871, 'samples': 2070528, 'steps': 10783, 'loss/train': 1.8574343919754028} +11/06/2021 22:44:38 - INFO - __main__ - Step 10785: {'lr': 0.0004956667636713427, 'samples': 2070720, 'steps': 10784, 'loss/train': 1.5868165493011475} +11/06/2021 22:44:39 - INFO - __main__ - Step 10786: {'lr': 0.0004956657798558047, 'samples': 2070912, 'steps': 10785, 'loss/train': 1.4748395681381226} +11/06/2021 22:44:39 - INFO - __main__ - Step 10787: {'lr': 0.0004956647959295735, 'samples': 2071104, 'steps': 10786, 'loss/train': 1.701545000076294} +11/06/2021 22:44:40 - INFO - __main__ - Step 10788: {'lr': 0.0004956638118926495, 'samples': 2071296, 'steps': 10787, 'loss/train': 1.976759910583496} +11/06/2021 22:44:40 - INFO - __main__ - Step 10789: {'lr': 0.0004956628277450333, 'samples': 2071488, 'steps': 10788, 'loss/train': 2.1454813480377197} +11/06/2021 22:44:41 - INFO - __main__ - Step 10790: {'lr': 0.0004956618434867251, 'samples': 2071680, 'steps': 10789, 'loss/train': 1.5759694576263428} +11/06/2021 22:44:41 - INFO - __main__ - Step 10791: {'lr': 0.0004956608591177256, 'samples': 2071872, 'steps': 10790, 'loss/train': 1.8092042207717896} +11/06/2021 22:44:41 - INFO - __main__ - Step 10792: {'lr': 0.0004956598746380349, 'samples': 2072064, 'steps': 10791, 'loss/train': 1.6778979301452637} +11/06/2021 22:44:43 - INFO - __main__ - Step 10793: {'lr': 0.0004956588900476538, 'samples': 2072256, 'steps': 10792, 'loss/train': 1.459761381149292} +11/06/2021 22:44:43 - INFO - __main__ - Step 10794: {'lr': 0.0004956579053465826, 'samples': 2072448, 'steps': 10793, 'loss/train': 1.5399609804153442} +11/06/2021 22:44:43 - INFO - __main__ - Step 10795: {'lr': 0.0004956569205348217, 'samples': 2072640, 'steps': 10794, 'loss/train': 1.4473868608474731} +11/06/2021 22:44:44 - INFO - __main__ - Step 10796: {'lr': 0.0004956559356123717, 'samples': 2072832, 'steps': 10795, 'loss/train': 1.825037956237793} +11/06/2021 22:44:44 - INFO - __main__ - Step 10797: {'lr': 0.0004956549505792327, 'samples': 2073024, 'steps': 10796, 'loss/train': 2.264521360397339} +11/06/2021 22:44:45 - INFO - __main__ - Step 10798: {'lr': 0.0004956539654354055, 'samples': 2073216, 'steps': 10797, 'loss/train': 1.450287938117981} +11/06/2021 22:44:45 - INFO - __main__ - Step 10799: {'lr': 0.0004956529801808904, 'samples': 2073408, 'steps': 10798, 'loss/train': 1.9415364265441895} +11/06/2021 22:44:46 - INFO - __main__ - Step 10800: {'lr': 0.0004956519948156879, 'samples': 2073600, 'steps': 10799, 'loss/train': 1.7281900644302368} +11/06/2021 22:44:46 - INFO - __main__ - Step 10801: {'lr': 0.0004956510093397983, 'samples': 2073792, 'steps': 10800, 'loss/train': 1.6848071813583374} +11/06/2021 22:44:46 - INFO - __main__ - Step 10802: {'lr': 0.0004956500237532222, 'samples': 2073984, 'steps': 10801, 'loss/train': 2.119485855102539} +11/06/2021 22:44:47 - INFO - __main__ - Step 10803: {'lr': 0.0004956490380559601, 'samples': 2074176, 'steps': 10802, 'loss/train': 1.7440723180770874} +11/06/2021 22:44:48 - INFO - __main__ - Step 10804: {'lr': 0.0004956480522480121, 'samples': 2074368, 'steps': 10803, 'loss/train': 1.6248648166656494} +11/06/2021 22:44:48 - INFO - __main__ - Step 10805: {'lr': 0.000495647066329379, 'samples': 2074560, 'steps': 10804, 'loss/train': 2.111401081085205} +11/06/2021 22:44:49 - INFO - __main__ - Step 10806: {'lr': 0.0004956460803000612, 'samples': 2074752, 'steps': 10805, 'loss/train': 2.2455363273620605} +11/06/2021 22:44:49 - INFO - __main__ - Step 10807: {'lr': 0.0004956450941600589, 'samples': 2074944, 'steps': 10806, 'loss/train': 4.325562477111816} +11/06/2021 22:44:49 - INFO - __main__ - Step 10808: {'lr': 0.0004956441079093729, 'samples': 2075136, 'steps': 10807, 'loss/train': 1.592270851135254} +11/06/2021 22:44:50 - INFO - __main__ - Step 10809: {'lr': 0.0004956431215480034, 'samples': 2075328, 'steps': 10808, 'loss/train': 1.865347981452942} +11/06/2021 22:44:51 - INFO - __main__ - Step 10810: {'lr': 0.0004956421350759508, 'samples': 2075520, 'steps': 10809, 'loss/train': 1.3117084503173828} +11/06/2021 22:44:51 - INFO - __main__ - Step 10811: {'lr': 0.0004956411484932158, 'samples': 2075712, 'steps': 10810, 'loss/train': 1.8176014423370361} +11/06/2021 22:44:51 - INFO - __main__ - Step 10812: {'lr': 0.0004956401617997985, 'samples': 2075904, 'steps': 10811, 'loss/train': 1.2668240070343018} +11/06/2021 22:44:52 - INFO - __main__ - Step 10813: {'lr': 0.0004956391749956997, 'samples': 2076096, 'steps': 10812, 'loss/train': 2.1930673122406006} +11/06/2021 22:44:53 - INFO - __main__ - Step 10814: {'lr': 0.0004956381880809195, 'samples': 2076288, 'steps': 10813, 'loss/train': 2.0894155502319336} +11/06/2021 22:44:53 - INFO - __main__ - Step 10815: {'lr': 0.0004956372010554587, 'samples': 2076480, 'steps': 10814, 'loss/train': 1.8282910585403442} +11/06/2021 22:44:54 - INFO - __main__ - Step 10816: {'lr': 0.0004956362139193174, 'samples': 2076672, 'steps': 10815, 'loss/train': 2.062333345413208} +11/06/2021 22:44:54 - INFO - __main__ - Step 10817: {'lr': 0.0004956352266724964, 'samples': 2076864, 'steps': 10816, 'loss/train': 1.4473098516464233} +11/06/2021 22:44:54 - INFO - __main__ - Step 10818: {'lr': 0.0004956342393149959, 'samples': 2077056, 'steps': 10817, 'loss/train': 1.7274878025054932} +11/06/2021 22:44:56 - INFO - __main__ - Step 10819: {'lr': 0.0004956332518468163, 'samples': 2077248, 'steps': 10818, 'loss/train': 1.570633053779602} +11/06/2021 22:44:56 - INFO - __main__ - Step 10820: {'lr': 0.0004956322642679583, 'samples': 2077440, 'steps': 10819, 'loss/train': 1.7297214269638062} +11/06/2021 22:44:56 - INFO - __main__ - Step 10821: {'lr': 0.000495631276578422, 'samples': 2077632, 'steps': 10820, 'loss/train': 4.519792079925537} +11/06/2021 22:44:57 - INFO - __main__ - Step 10822: {'lr': 0.0004956302887782082, 'samples': 2077824, 'steps': 10821, 'loss/train': 1.0446696281433105} +11/06/2021 22:44:57 - INFO - __main__ - Step 10823: {'lr': 0.0004956293008673172, 'samples': 2078016, 'steps': 10822, 'loss/train': 0.5035202503204346} +11/06/2021 22:44:57 - INFO - __main__ - Step 10824: {'lr': 0.0004956283128457493, 'samples': 2078208, 'steps': 10823, 'loss/train': 0.34573525190353394} +11/06/2021 22:44:58 - INFO - __main__ - Step 10825: {'lr': 0.0004956273247135051, 'samples': 2078400, 'steps': 10824, 'loss/train': 1.6415156126022339} +11/06/2021 22:44:59 - INFO - __main__ - Step 10826: {'lr': 0.0004956263364705851, 'samples': 2078592, 'steps': 10825, 'loss/train': 1.6332308053970337} +11/06/2021 22:44:59 - INFO - __main__ - Step 10827: {'lr': 0.0004956253481169895, 'samples': 2078784, 'steps': 10826, 'loss/train': 2.319352865219116} +11/06/2021 22:44:59 - INFO - __main__ - Step 10828: {'lr': 0.0004956243596527191, 'samples': 2078976, 'steps': 10827, 'loss/train': 1.773661494255066} +11/06/2021 22:45:00 - INFO - __main__ - Step 10829: {'lr': 0.000495623371077774, 'samples': 2079168, 'steps': 10828, 'loss/train': 1.8046337366104126} +11/06/2021 22:45:01 - INFO - __main__ - Step 10830: {'lr': 0.000495622382392155, 'samples': 2079360, 'steps': 10829, 'loss/train': 1.06633460521698} +11/06/2021 22:45:01 - INFO - __main__ - Step 10831: {'lr': 0.0004956213935958621, 'samples': 2079552, 'steps': 10830, 'loss/train': 1.7313029766082764} +11/06/2021 22:45:02 - INFO - __main__ - Step 10832: {'lr': 0.0004956204046888961, 'samples': 2079744, 'steps': 10831, 'loss/train': 1.655548095703125} +11/06/2021 22:45:02 - INFO - __main__ - Step 10833: {'lr': 0.0004956194156712574, 'samples': 2079936, 'steps': 10832, 'loss/train': 2.0152714252471924} +11/06/2021 22:45:02 - INFO - __main__ - Step 10834: {'lr': 0.0004956184265429463, 'samples': 2080128, 'steps': 10833, 'loss/train': 2.010787010192871} +11/06/2021 22:45:03 - INFO - __main__ - Step 10835: {'lr': 0.0004956174373039634, 'samples': 2080320, 'steps': 10834, 'loss/train': 1.838008999824524} +11/06/2021 22:45:04 - INFO - __main__ - Step 10836: {'lr': 0.0004956164479543089, 'samples': 2080512, 'steps': 10835, 'loss/train': 1.985622525215149} +11/06/2021 22:45:04 - INFO - __main__ - Step 10837: {'lr': 0.0004956154584939836, 'samples': 2080704, 'steps': 10836, 'loss/train': 1.8421908617019653} +11/06/2021 22:45:04 - INFO - __main__ - Step 10838: {'lr': 0.0004956144689229877, 'samples': 2080896, 'steps': 10837, 'loss/train': 2.1746902465820312} +11/06/2021 22:45:05 - INFO - __main__ - Step 10839: {'lr': 0.0004956134792413218, 'samples': 2081088, 'steps': 10838, 'loss/train': 1.700150966644287} +11/06/2021 22:45:05 - INFO - __main__ - Step 10840: {'lr': 0.0004956124894489861, 'samples': 2081280, 'steps': 10839, 'loss/train': 2.058382749557495} +11/06/2021 22:45:06 - INFO - __main__ - Step 10841: {'lr': 0.0004956114995459813, 'samples': 2081472, 'steps': 10840, 'loss/train': 6.1868720054626465} +11/06/2021 22:45:06 - INFO - __main__ - Step 10842: {'lr': 0.0004956105095323077, 'samples': 2081664, 'steps': 10841, 'loss/train': 1.7854186296463013} +11/06/2021 22:45:07 - INFO - __main__ - Step 10843: {'lr': 0.0004956095194079658, 'samples': 2081856, 'steps': 10842, 'loss/train': 1.8103166818618774} +11/06/2021 22:45:07 - INFO - __main__ - Step 10844: {'lr': 0.000495608529172956, 'samples': 2082048, 'steps': 10843, 'loss/train': 1.3330121040344238} +11/06/2021 22:45:08 - INFO - __main__ - Step 10845: {'lr': 0.0004956075388272789, 'samples': 2082240, 'steps': 10844, 'loss/train': 1.5644762516021729} +11/06/2021 22:45:09 - INFO - __main__ - Step 10846: {'lr': 0.0004956065483709348, 'samples': 2082432, 'steps': 10845, 'loss/train': 1.6880342960357666} +11/06/2021 22:45:09 - INFO - __main__ - Step 10847: {'lr': 0.0004956055578039241, 'samples': 2082624, 'steps': 10846, 'loss/train': 1.727042317390442} +11/06/2021 22:45:09 - INFO - __main__ - Step 10848: {'lr': 0.0004956045671262475, 'samples': 2082816, 'steps': 10847, 'loss/train': 1.3795113563537598} +11/06/2021 22:45:10 - INFO - __main__ - Step 10849: {'lr': 0.0004956035763379051, 'samples': 2083008, 'steps': 10848, 'loss/train': 1.9024347066879272} +11/06/2021 22:45:10 - INFO - __main__ - Step 10850: {'lr': 0.0004956025854388976, 'samples': 2083200, 'steps': 10849, 'loss/train': 0.8960413336753845} +11/06/2021 22:45:11 - INFO - __main__ - Step 10851: {'lr': 0.0004956015944292253, 'samples': 2083392, 'steps': 10850, 'loss/train': 2.1259398460388184} +11/06/2021 22:45:11 - INFO - __main__ - Step 10852: {'lr': 0.0004956006033088888, 'samples': 2083584, 'steps': 10851, 'loss/train': 1.9654005765914917} +11/06/2021 22:45:12 - INFO - __main__ - Step 10853: {'lr': 0.0004955996120778884, 'samples': 2083776, 'steps': 10852, 'loss/train': 1.8148349523544312} +11/06/2021 22:45:12 - INFO - __main__ - Step 10854: {'lr': 0.0004955986207362246, 'samples': 2083968, 'steps': 10853, 'loss/train': 0.7852979898452759} +11/06/2021 22:45:12 - INFO - __main__ - Step 10855: {'lr': 0.0004955976292838979, 'samples': 2084160, 'steps': 10854, 'loss/train': 1.4349844455718994} +11/06/2021 22:45:14 - INFO - __main__ - Step 10856: {'lr': 0.0004955966377209086, 'samples': 2084352, 'steps': 10855, 'loss/train': 1.8268946409225464} +11/06/2021 22:45:14 - INFO - __main__ - Step 10857: {'lr': 0.0004955956460472573, 'samples': 2084544, 'steps': 10856, 'loss/train': 2.225966453552246} +11/06/2021 22:45:14 - INFO - __main__ - Step 10858: {'lr': 0.0004955946542629444, 'samples': 2084736, 'steps': 10857, 'loss/train': 1.7703862190246582} +11/06/2021 22:45:15 - INFO - __main__ - Step 10859: {'lr': 0.0004955936623679703, 'samples': 2084928, 'steps': 10858, 'loss/train': 2.2991316318511963} +11/06/2021 22:45:15 - INFO - __main__ - Step 10860: {'lr': 0.0004955926703623356, 'samples': 2085120, 'steps': 10859, 'loss/train': 2.4180328845977783} +11/06/2021 22:45:15 - INFO - __main__ - Step 10861: {'lr': 0.0004955916782460405, 'samples': 2085312, 'steps': 10860, 'loss/train': 2.1252551078796387} +11/06/2021 22:45:16 - INFO - __main__ - Step 10862: {'lr': 0.0004955906860190857, 'samples': 2085504, 'steps': 10861, 'loss/train': 1.9650782346725464} +11/06/2021 22:45:17 - INFO - __main__ - Step 10863: {'lr': 0.0004955896936814714, 'samples': 2085696, 'steps': 10862, 'loss/train': 1.8924416303634644} +11/06/2021 22:45:17 - INFO - __main__ - Step 10864: {'lr': 0.0004955887012331982, 'samples': 2085888, 'steps': 10863, 'loss/train': 1.7115322351455688} +11/06/2021 22:45:17 - INFO - __main__ - Step 10865: {'lr': 0.0004955877086742666, 'samples': 2086080, 'steps': 10864, 'loss/train': 1.3016084432601929} +11/06/2021 22:45:18 - INFO - __main__ - Step 10866: {'lr': 0.0004955867160046769, 'samples': 2086272, 'steps': 10865, 'loss/train': 1.6526113748550415} +11/06/2021 22:45:19 - INFO - __main__ - Step 10867: {'lr': 0.0004955857232244297, 'samples': 2086464, 'steps': 10866, 'loss/train': 1.5143797397613525} +11/06/2021 22:45:19 - INFO - __main__ - Step 10868: {'lr': 0.0004955847303335253, 'samples': 2086656, 'steps': 10867, 'loss/train': 1.8986718654632568} +11/06/2021 22:45:19 - INFO - __main__ - Step 10869: {'lr': 0.0004955837373319641, 'samples': 2086848, 'steps': 10868, 'loss/train': 1.6956390142440796} +11/06/2021 22:45:20 - INFO - __main__ - Step 10870: {'lr': 0.0004955827442197468, 'samples': 2087040, 'steps': 10869, 'loss/train': 1.9190312623977661} +11/06/2021 22:45:20 - INFO - __main__ - Step 10871: {'lr': 0.0004955817509968737, 'samples': 2087232, 'steps': 10870, 'loss/train': 1.3590363264083862} +11/06/2021 22:45:21 - INFO - __main__ - Step 10872: {'lr': 0.0004955807576633452, 'samples': 2087424, 'steps': 10871, 'loss/train': 1.7737996578216553} +11/06/2021 22:45:22 - INFO - __main__ - Step 10873: {'lr': 0.0004955797642191618, 'samples': 2087616, 'steps': 10872, 'loss/train': 1.8622442483901978} +11/06/2021 22:45:22 - INFO - __main__ - Step 10874: {'lr': 0.000495578770664324, 'samples': 2087808, 'steps': 10873, 'loss/train': 1.9006373882293701} +11/06/2021 22:45:22 - INFO - __main__ - Step 10875: {'lr': 0.0004955777769988322, 'samples': 2088000, 'steps': 10874, 'loss/train': 2.0556890964508057} +11/06/2021 22:45:23 - INFO - __main__ - Step 10876: {'lr': 0.0004955767832226868, 'samples': 2088192, 'steps': 10875, 'loss/train': 1.6354632377624512} +11/06/2021 22:45:24 - INFO - __main__ - Step 10877: {'lr': 0.0004955757893358884, 'samples': 2088384, 'steps': 10876, 'loss/train': 1.777341365814209} +11/06/2021 22:45:24 - INFO - __main__ - Step 10878: {'lr': 0.0004955747953384372, 'samples': 2088576, 'steps': 10877, 'loss/train': 1.4678032398223877} +11/06/2021 22:45:25 - INFO - __main__ - Step 10879: {'lr': 0.0004955738012303338, 'samples': 2088768, 'steps': 10878, 'loss/train': 2.07291579246521} +11/06/2021 22:45:25 - INFO - __main__ - Step 10880: {'lr': 0.0004955728070115787, 'samples': 2088960, 'steps': 10879, 'loss/train': 1.9695255756378174} +11/06/2021 22:45:25 - INFO - __main__ - Step 10881: {'lr': 0.0004955718126821722, 'samples': 2089152, 'steps': 10880, 'loss/train': 2.657900094985962} +11/06/2021 22:45:26 - INFO - __main__ - Step 10882: {'lr': 0.0004955708182421149, 'samples': 2089344, 'steps': 10881, 'loss/train': 1.587023377418518} +11/06/2021 22:45:26 - INFO - __main__ - Step 10883: {'lr': 0.0004955698236914071, 'samples': 2089536, 'steps': 10882, 'loss/train': 1.4646183252334595} +11/06/2021 22:45:27 - INFO - __main__ - Step 10884: {'lr': 0.0004955688290300494, 'samples': 2089728, 'steps': 10883, 'loss/train': 2.305067539215088} +11/06/2021 22:45:27 - INFO - __main__ - Step 10885: {'lr': 0.0004955678342580421, 'samples': 2089920, 'steps': 10884, 'loss/train': 2.04618501663208} +11/06/2021 22:45:28 - INFO - __main__ - Step 10886: {'lr': 0.0004955668393753858, 'samples': 2090112, 'steps': 10885, 'loss/train': 1.8852858543395996} +11/06/2021 22:45:28 - INFO - __main__ - Step 10887: {'lr': 0.0004955658443820809, 'samples': 2090304, 'steps': 10886, 'loss/train': 1.9681472778320312} +11/06/2021 22:45:28 - INFO - __main__ - Step 10888: {'lr': 0.0004955648492781277, 'samples': 2090496, 'steps': 10887, 'loss/train': 2.0879921913146973} +11/06/2021 22:45:30 - INFO - __main__ - Step 10889: {'lr': 0.0004955638540635269, 'samples': 2090688, 'steps': 10888, 'loss/train': 1.7729140520095825} +11/06/2021 22:45:30 - INFO - __main__ - Step 10890: {'lr': 0.0004955628587382788, 'samples': 2090880, 'steps': 10889, 'loss/train': 1.8550975322723389} +11/06/2021 22:45:30 - INFO - __main__ - Step 10891: {'lr': 0.0004955618633023837, 'samples': 2091072, 'steps': 10890, 'loss/train': 1.8905608654022217} +11/06/2021 22:45:31 - INFO - __main__ - Step 10892: {'lr': 0.0004955608677558424, 'samples': 2091264, 'steps': 10891, 'loss/train': 1.5222508907318115} +11/06/2021 22:45:31 - INFO - __main__ - Step 10893: {'lr': 0.0004955598720986551, 'samples': 2091456, 'steps': 10892, 'loss/train': 1.770163655281067} +11/06/2021 22:45:32 - INFO - __main__ - Step 10894: {'lr': 0.0004955588763308223, 'samples': 2091648, 'steps': 10893, 'loss/train': 1.9412416219711304} +11/06/2021 22:45:32 - INFO - __main__ - Step 10895: {'lr': 0.0004955578804523445, 'samples': 2091840, 'steps': 10894, 'loss/train': 1.9182251691818237} +11/06/2021 22:45:33 - INFO - __main__ - Step 10896: {'lr': 0.000495556884463222, 'samples': 2092032, 'steps': 10895, 'loss/train': 1.7548394203186035} +11/06/2021 22:45:33 - INFO - __main__ - Step 10897: {'lr': 0.0004955558883634555, 'samples': 2092224, 'steps': 10896, 'loss/train': 2.1378374099731445} +11/06/2021 22:45:33 - INFO - __main__ - Step 10898: {'lr': 0.0004955548921530452, 'samples': 2092416, 'steps': 10897, 'loss/train': 1.4862196445465088} +11/06/2021 22:45:34 - INFO - __main__ - Step 10899: {'lr': 0.0004955538958319917, 'samples': 2092608, 'steps': 10898, 'loss/train': 1.4818750619888306} +11/06/2021 22:45:35 - INFO - __main__ - Step 10900: {'lr': 0.0004955528994002954, 'samples': 2092800, 'steps': 10899, 'loss/train': 2.25352144241333} +11/06/2021 22:45:35 - INFO - __main__ - Step 10901: {'lr': 0.0004955519028579568, 'samples': 2092992, 'steps': 10900, 'loss/train': 1.904826045036316} +11/06/2021 22:45:35 - INFO - __main__ - Step 10902: {'lr': 0.0004955509062049763, 'samples': 2093184, 'steps': 10901, 'loss/train': 2.2646710872650146} +11/06/2021 22:45:36 - INFO - __main__ - Step 10903: {'lr': 0.0004955499094413542, 'samples': 2093376, 'steps': 10902, 'loss/train': 1.8453540802001953} +11/06/2021 22:45:37 - INFO - __main__ - Step 10904: {'lr': 0.0004955489125670912, 'samples': 2093568, 'steps': 10903, 'loss/train': 1.2901415824890137} +11/06/2021 22:45:37 - INFO - __main__ - Step 10905: {'lr': 0.0004955479155821877, 'samples': 2093760, 'steps': 10904, 'loss/train': 1.7908188104629517} +11/06/2021 22:45:37 - INFO - __main__ - Step 10906: {'lr': 0.000495546918486644, 'samples': 2093952, 'steps': 10905, 'loss/train': 1.9787135124206543} +11/06/2021 22:45:38 - INFO - __main__ - Step 10907: {'lr': 0.0004955459212804607, 'samples': 2094144, 'steps': 10906, 'loss/train': 0.762311577796936} +11/06/2021 22:45:38 - INFO - __main__ - Step 10908: {'lr': 0.0004955449239636382, 'samples': 2094336, 'steps': 10907, 'loss/train': 1.5875378847122192} +11/06/2021 22:45:38 - INFO - __main__ - Step 10909: {'lr': 0.000495543926536177, 'samples': 2094528, 'steps': 10908, 'loss/train': 1.9852023124694824} +11/06/2021 22:45:39 - INFO - __main__ - Step 10910: {'lr': 0.0004955429289980774, 'samples': 2094720, 'steps': 10909, 'loss/train': 1.7083479166030884} +11/06/2021 22:45:40 - INFO - __main__ - Step 10911: {'lr': 0.00049554193134934, 'samples': 2094912, 'steps': 10910, 'loss/train': 2.226473808288574} +11/06/2021 22:45:40 - INFO - __main__ - Step 10912: {'lr': 0.0004955409335899651, 'samples': 2095104, 'steps': 10911, 'loss/train': 1.7257845401763916} +11/06/2021 22:45:40 - INFO - __main__ - Step 10913: {'lr': 0.0004955399357199534, 'samples': 2095296, 'steps': 10912, 'loss/train': 1.5614092350006104} +11/06/2021 22:45:41 - INFO - __main__ - Step 10914: {'lr': 0.0004955389377393051, 'samples': 2095488, 'steps': 10913, 'loss/train': 1.6544125080108643} +11/06/2021 22:45:42 - INFO - __main__ - Step 10915: {'lr': 0.0004955379396480207, 'samples': 2095680, 'steps': 10914, 'loss/train': 2.452582836151123} +11/06/2021 22:45:42 - INFO - __main__ - Step 10916: {'lr': 0.0004955369414461007, 'samples': 2095872, 'steps': 10915, 'loss/train': 1.0178364515304565} +11/06/2021 22:45:43 - INFO - __main__ - Step 10917: {'lr': 0.0004955359431335456, 'samples': 2096064, 'steps': 10916, 'loss/train': 0.8691990375518799} +11/06/2021 22:45:43 - INFO - __main__ - Step 10918: {'lr': 0.0004955349447103559, 'samples': 2096256, 'steps': 10917, 'loss/train': 1.4804587364196777} +11/06/2021 22:45:43 - INFO - __main__ - Step 10919: {'lr': 0.0004955339461765318, 'samples': 2096448, 'steps': 10918, 'loss/train': 1.8954075574874878} +11/06/2021 22:45:44 - INFO - __main__ - Step 10920: {'lr': 0.0004955329475320739, 'samples': 2096640, 'steps': 10919, 'loss/train': 1.3000982999801636} +11/06/2021 22:45:45 - INFO - __main__ - Step 10921: {'lr': 0.0004955319487769827, 'samples': 2096832, 'steps': 10920, 'loss/train': 1.6396160125732422} +11/06/2021 22:45:45 - INFO - __main__ - Step 10922: {'lr': 0.0004955309499112586, 'samples': 2097024, 'steps': 10921, 'loss/train': 1.534606695175171} +11/06/2021 22:45:45 - INFO - __main__ - Step 10923: {'lr': 0.000495529950934902, 'samples': 2097216, 'steps': 10922, 'loss/train': 1.6064701080322266} +11/06/2021 22:45:46 - INFO - __main__ - Step 10924: {'lr': 0.0004955289518479134, 'samples': 2097408, 'steps': 10923, 'loss/train': 1.5156863927841187} +11/06/2021 22:45:47 - INFO - __main__ - Step 10925: {'lr': 0.0004955279526502931, 'samples': 2097600, 'steps': 10924, 'loss/train': 1.9213401079177856} +11/06/2021 22:45:47 - INFO - __main__ - Step 10926: {'lr': 0.0004955269533420419, 'samples': 2097792, 'steps': 10925, 'loss/train': 1.5095373392105103} +11/06/2021 22:45:47 - INFO - __main__ - Step 10927: {'lr': 0.00049552595392316, 'samples': 2097984, 'steps': 10926, 'loss/train': 1.9724854230880737} +11/06/2021 22:45:48 - INFO - __main__ - Step 10928: {'lr': 0.0004955249543936479, 'samples': 2098176, 'steps': 10927, 'loss/train': 1.7889426946640015} +11/06/2021 22:45:48 - INFO - __main__ - Step 10929: {'lr': 0.000495523954753506, 'samples': 2098368, 'steps': 10928, 'loss/train': 2.7239041328430176} +11/06/2021 22:45:49 - INFO - __main__ - Step 10930: {'lr': 0.0004955229550027347, 'samples': 2098560, 'steps': 10929, 'loss/train': 1.7207810878753662} +11/06/2021 22:45:49 - INFO - __main__ - Step 10931: {'lr': 0.0004955219551413347, 'samples': 2098752, 'steps': 10930, 'loss/train': 1.4292515516281128} +11/06/2021 22:45:50 - INFO - __main__ - Step 10932: {'lr': 0.0004955209551693063, 'samples': 2098944, 'steps': 10931, 'loss/train': 2.1134376525878906} +11/06/2021 22:45:50 - INFO - __main__ - Step 10933: {'lr': 0.0004955199550866498, 'samples': 2099136, 'steps': 10932, 'loss/train': 1.5380351543426514} +11/06/2021 22:45:51 - INFO - __main__ - Step 10934: {'lr': 0.000495518954893366, 'samples': 2099328, 'steps': 10933, 'loss/train': 1.7026230096817017} +11/06/2021 22:45:51 - INFO - __main__ - Step 10935: {'lr': 0.000495517954589455, 'samples': 2099520, 'steps': 10934, 'loss/train': 1.979361891746521} +11/06/2021 22:45:52 - INFO - __main__ - Step 10936: {'lr': 0.0004955169541749173, 'samples': 2099712, 'steps': 10935, 'loss/train': 1.7494332790374756} +11/06/2021 22:45:52 - INFO - __main__ - Step 10937: {'lr': 0.0004955159536497536, 'samples': 2099904, 'steps': 10936, 'loss/train': 1.8730812072753906} +11/06/2021 22:45:53 - INFO - __main__ - Step 10938: {'lr': 0.0004955149530139643, 'samples': 2100096, 'steps': 10937, 'loss/train': 1.707970142364502} +11/06/2021 22:45:53 - INFO - __main__ - Step 10939: {'lr': 0.0004955139522675496, 'samples': 2100288, 'steps': 10938, 'loss/train': 2.6687307357788086} +11/06/2021 22:45:53 - INFO - __main__ - Step 10940: {'lr': 0.0004955129514105101, 'samples': 2100480, 'steps': 10939, 'loss/train': 2.0217690467834473} +11/06/2021 22:45:54 - INFO - __main__ - Step 10941: {'lr': 0.0004955119504428464, 'samples': 2100672, 'steps': 10940, 'loss/train': 1.6573915481567383} +11/06/2021 22:45:55 - INFO - __main__ - Step 10942: {'lr': 0.0004955109493645587, 'samples': 2100864, 'steps': 10941, 'loss/train': 1.8716685771942139} +11/06/2021 22:45:55 - INFO - __main__ - Step 10943: {'lr': 0.0004955099481756475, 'samples': 2101056, 'steps': 10942, 'loss/train': 2.186129331588745} +11/06/2021 22:45:55 - INFO - __main__ - Step 10944: {'lr': 0.0004955089468761133, 'samples': 2101248, 'steps': 10943, 'loss/train': 2.171231985092163} +11/06/2021 22:45:56 - INFO - __main__ - Step 10945: {'lr': 0.0004955079454659567, 'samples': 2101440, 'steps': 10944, 'loss/train': 1.6056174039840698} +11/06/2021 22:45:57 - INFO - __main__ - Step 10946: {'lr': 0.0004955069439451778, 'samples': 2101632, 'steps': 10945, 'loss/train': 1.8130086660385132} +11/06/2021 22:45:57 - INFO - __main__ - Step 10947: {'lr': 0.0004955059423137774, 'samples': 2101824, 'steps': 10946, 'loss/train': 1.8952678442001343} +11/06/2021 22:45:57 - INFO - __main__ - Step 10948: {'lr': 0.0004955049405717558, 'samples': 2102016, 'steps': 10947, 'loss/train': 1.9916630983352661} +11/06/2021 22:45:58 - INFO - __main__ - Step 10949: {'lr': 0.0004955039387191135, 'samples': 2102208, 'steps': 10948, 'loss/train': 1.791800618171692} +11/06/2021 22:45:58 - INFO - __main__ - Step 10950: {'lr': 0.0004955029367558508, 'samples': 2102400, 'steps': 10949, 'loss/train': 1.4076131582260132} +11/06/2021 22:45:59 - INFO - __main__ - Step 10951: {'lr': 0.0004955019346819684, 'samples': 2102592, 'steps': 10950, 'loss/train': 1.7060812711715698} +11/06/2021 22:45:59 - INFO - __main__ - Step 10952: {'lr': 0.0004955009324974666, 'samples': 2102784, 'steps': 10951, 'loss/train': 1.271490216255188} +11/06/2021 22:46:00 - INFO - __main__ - Step 10953: {'lr': 0.0004954999302023458, 'samples': 2102976, 'steps': 10952, 'loss/train': 2.104248046875} +11/06/2021 22:46:00 - INFO - __main__ - Step 10954: {'lr': 0.0004954989277966064, 'samples': 2103168, 'steps': 10953, 'loss/train': 1.4961109161376953} +11/06/2021 22:46:01 - INFO - __main__ - Step 10955: {'lr': 0.0004954979252802491, 'samples': 2103360, 'steps': 10954, 'loss/train': 1.854745626449585} +11/06/2021 22:46:02 - INFO - __main__ - Step 10956: {'lr': 0.0004954969226532743, 'samples': 2103552, 'steps': 10955, 'loss/train': 1.7922343015670776} +11/06/2021 22:46:02 - INFO - __main__ - Step 10957: {'lr': 0.0004954959199156824, 'samples': 2103744, 'steps': 10956, 'loss/train': 2.0796141624450684} +11/06/2021 22:46:02 - INFO - __main__ - Step 10958: {'lr': 0.0004954949170674736, 'samples': 2103936, 'steps': 10957, 'loss/train': 2.0407614707946777} +11/06/2021 22:46:03 - INFO - __main__ - Step 10959: {'lr': 0.0004954939141086488, 'samples': 2104128, 'steps': 10958, 'loss/train': 1.2875730991363525} +11/06/2021 22:46:03 - INFO - __main__ - Step 10960: {'lr': 0.0004954929110392081, 'samples': 2104320, 'steps': 10959, 'loss/train': 1.918273687362671} +11/06/2021 22:46:04 - INFO - __main__ - Step 10961: {'lr': 0.0004954919078591521, 'samples': 2104512, 'steps': 10960, 'loss/train': 1.7532039880752563} +11/06/2021 22:46:05 - INFO - __main__ - Step 10962: {'lr': 0.0004954909045684812, 'samples': 2104704, 'steps': 10961, 'loss/train': 1.595262050628662} +11/06/2021 22:46:05 - INFO - __main__ - Step 10963: {'lr': 0.000495489901167196, 'samples': 2104896, 'steps': 10962, 'loss/train': 1.8555185794830322} +11/06/2021 22:46:05 - INFO - __main__ - Step 10964: {'lr': 0.0004954888976552968, 'samples': 2105088, 'steps': 10963, 'loss/train': 1.559324026107788} +11/06/2021 22:46:06 - INFO - __main__ - Step 10965: {'lr': 0.0004954878940327841, 'samples': 2105280, 'steps': 10964, 'loss/train': 1.616891860961914} +11/06/2021 22:46:07 - INFO - __main__ - Step 10966: {'lr': 0.0004954868902996582, 'samples': 2105472, 'steps': 10965, 'loss/train': 1.9043447971343994} +11/06/2021 22:46:07 - INFO - __main__ - Step 10967: {'lr': 0.0004954858864559199, 'samples': 2105664, 'steps': 10966, 'loss/train': 2.002821922302246} +11/06/2021 22:46:07 - INFO - __main__ - Step 10968: {'lr': 0.0004954848825015694, 'samples': 2105856, 'steps': 10967, 'loss/train': 1.3038442134857178} +11/06/2021 22:46:08 - INFO - __main__ - Step 10969: {'lr': 0.0004954838784366071, 'samples': 2106048, 'steps': 10968, 'loss/train': 1.6041873693466187} +11/06/2021 22:46:08 - INFO - __main__ - Step 10970: {'lr': 0.0004954828742610336, 'samples': 2106240, 'steps': 10969, 'loss/train': 2.28267502784729} +11/06/2021 22:46:09 - INFO - __main__ - Step 10971: {'lr': 0.0004954818699748493, 'samples': 2106432, 'steps': 10970, 'loss/train': 1.9312834739685059} +11/06/2021 22:46:09 - INFO - __main__ - Step 10972: {'lr': 0.0004954808655780546, 'samples': 2106624, 'steps': 10971, 'loss/train': 1.7641648054122925} +11/06/2021 22:46:10 - INFO - __main__ - Step 10973: {'lr': 0.0004954798610706502, 'samples': 2106816, 'steps': 10972, 'loss/train': 1.8444775342941284} +11/06/2021 22:46:10 - INFO - __main__ - Step 10974: {'lr': 0.0004954788564526362, 'samples': 2107008, 'steps': 10973, 'loss/train': 1.9866970777511597} +11/06/2021 22:46:10 - INFO - __main__ - Step 10975: {'lr': 0.0004954778517240133, 'samples': 2107200, 'steps': 10974, 'loss/train': 1.7459683418273926} +11/06/2021 22:46:11 - INFO - __main__ - Step 10976: {'lr': 0.0004954768468847818, 'samples': 2107392, 'steps': 10975, 'loss/train': 3.977201223373413} +11/06/2021 22:46:12 - INFO - __main__ - Step 10977: {'lr': 0.0004954758419349422, 'samples': 2107584, 'steps': 10976, 'loss/train': 1.9195420742034912} +11/06/2021 22:46:12 - INFO - __main__ - Step 10978: {'lr': 0.000495474836874495, 'samples': 2107776, 'steps': 10977, 'loss/train': 1.9030547142028809} +11/06/2021 22:46:12 - INFO - __main__ - Step 10979: {'lr': 0.0004954738317034408, 'samples': 2107968, 'steps': 10978, 'loss/train': 1.9866000413894653} +11/06/2021 22:46:13 - INFO - __main__ - Step 10980: {'lr': 0.0004954728264217796, 'samples': 2108160, 'steps': 10979, 'loss/train': 1.738264560699463} +11/06/2021 22:46:13 - INFO - __main__ - Step 10981: {'lr': 0.0004954718210295123, 'samples': 2108352, 'steps': 10980, 'loss/train': 1.8209415674209595} +11/06/2021 22:46:14 - INFO - __main__ - Step 10982: {'lr': 0.0004954708155266392, 'samples': 2108544, 'steps': 10981, 'loss/train': 1.931311011314392} +11/06/2021 22:46:15 - INFO - __main__ - Step 10983: {'lr': 0.0004954698099131606, 'samples': 2108736, 'steps': 10982, 'loss/train': 2.182440996170044} +11/06/2021 22:46:15 - INFO - __main__ - Step 10984: {'lr': 0.0004954688041890772, 'samples': 2108928, 'steps': 10983, 'loss/train': 1.8009920120239258} +11/06/2021 22:46:15 - INFO - __main__ - Step 10985: {'lr': 0.0004954677983543893, 'samples': 2109120, 'steps': 10984, 'loss/train': 1.65086829662323} +11/06/2021 22:46:16 - INFO - __main__ - Step 10986: {'lr': 0.0004954667924090974, 'samples': 2109312, 'steps': 10985, 'loss/train': 2.294792413711548} +11/06/2021 22:46:17 - INFO - __main__ - Step 10987: {'lr': 0.000495465786353202, 'samples': 2109504, 'steps': 10986, 'loss/train': 1.9113411903381348} +11/06/2021 22:46:17 - INFO - __main__ - Step 10988: {'lr': 0.0004954647801867035, 'samples': 2109696, 'steps': 10987, 'loss/train': 1.2942930459976196} +11/06/2021 22:46:17 - INFO - __main__ - Step 10989: {'lr': 0.0004954637739096023, 'samples': 2109888, 'steps': 10988, 'loss/train': 2.1266255378723145} +11/06/2021 22:46:18 - INFO - __main__ - Step 10990: {'lr': 0.0004954627675218989, 'samples': 2110080, 'steps': 10989, 'loss/train': 1.2343058586120605} +11/06/2021 22:46:18 - INFO - __main__ - Step 10991: {'lr': 0.0004954617610235939, 'samples': 2110272, 'steps': 10990, 'loss/train': 1.7390135526657104} +11/06/2021 22:46:18 - INFO - __main__ - Step 10992: {'lr': 0.0004954607544146875, 'samples': 2110464, 'steps': 10991, 'loss/train': 1.8976117372512817} +11/06/2021 22:46:20 - INFO - __main__ - Step 10993: {'lr': 0.0004954597476951804, 'samples': 2110656, 'steps': 10992, 'loss/train': 1.9760702848434448} +11/06/2021 22:46:20 - INFO - __main__ - Step 10994: {'lr': 0.0004954587408650727, 'samples': 2110848, 'steps': 10993, 'loss/train': 2.1973133087158203} +11/06/2021 22:46:21 - INFO - __main__ - Step 10995: {'lr': 0.0004954577339243652, 'samples': 2111040, 'steps': 10994, 'loss/train': 1.842615008354187} +11/06/2021 22:46:21 - INFO - __main__ - Step 10996: {'lr': 0.0004954567268730582, 'samples': 2111232, 'steps': 10995, 'loss/train': 1.7507246732711792} +11/06/2021 22:46:21 - INFO - __main__ - Step 10997: {'lr': 0.0004954557197111522, 'samples': 2111424, 'steps': 10996, 'loss/train': 4.712644577026367} +11/06/2021 22:46:22 - INFO - __main__ - Step 10998: {'lr': 0.0004954547124386477, 'samples': 2111616, 'steps': 10997, 'loss/train': 2.954491138458252} +11/06/2021 22:46:23 - INFO - __main__ - Step 10999: {'lr': 0.0004954537050555451, 'samples': 2111808, 'steps': 10998, 'loss/train': 1.7333556413650513} +11/06/2021 22:46:23 - INFO - __main__ - Step 11000: {'lr': 0.0004954526975618447, 'samples': 2112000, 'steps': 10999, 'loss/train': 1.7559417486190796} +11/06/2021 22:46:23 - INFO - __main__ - Step 11001: {'lr': 0.0004954516899575473, 'samples': 2112192, 'steps': 11000, 'loss/train': 1.4720401763916016} +11/06/2021 22:46:24 - INFO - __main__ - Step 11002: {'lr': 0.000495450682242653, 'samples': 2112384, 'steps': 11001, 'loss/train': 1.7932754755020142} +11/06/2021 22:46:24 - INFO - __main__ - Step 11003: {'lr': 0.0004954496744171624, 'samples': 2112576, 'steps': 11002, 'loss/train': 2.697819232940674} +11/06/2021 22:46:25 - INFO - __main__ - Step 11004: {'lr': 0.0004954486664810762, 'samples': 2112768, 'steps': 11003, 'loss/train': 1.973361849784851} +11/06/2021 22:46:25 - INFO - __main__ - Step 11005: {'lr': 0.0004954476584343945, 'samples': 2112960, 'steps': 11004, 'loss/train': 1.4034092426300049} +11/06/2021 22:46:26 - INFO - __main__ - Step 11006: {'lr': 0.0004954466502771178, 'samples': 2113152, 'steps': 11005, 'loss/train': 1.6337881088256836} +11/06/2021 22:46:26 - INFO - __main__ - Step 11007: {'lr': 0.0004954456420092466, 'samples': 2113344, 'steps': 11006, 'loss/train': 1.6302669048309326} +11/06/2021 22:46:27 - INFO - __main__ - Step 11008: {'lr': 0.0004954446336307814, 'samples': 2113536, 'steps': 11007, 'loss/train': 1.5346612930297852} +11/06/2021 22:46:28 - INFO - __main__ - Step 11009: {'lr': 0.0004954436251417227, 'samples': 2113728, 'steps': 11008, 'loss/train': 1.931561827659607} +11/06/2021 22:46:29 - INFO - __main__ - Step 11010: {'lr': 0.0004954426165420709, 'samples': 2113920, 'steps': 11009, 'loss/train': 2.0047390460968018} +11/06/2021 22:46:29 - INFO - __main__ - Step 11011: {'lr': 0.0004954416078318263, 'samples': 2114112, 'steps': 11010, 'loss/train': 1.6063743829727173} +11/06/2021 22:46:29 - INFO - __main__ - Step 11012: {'lr': 0.0004954405990109897, 'samples': 2114304, 'steps': 11011, 'loss/train': 1.1053050756454468} +11/06/2021 22:46:30 - INFO - __main__ - Step 11013: {'lr': 0.0004954395900795611, 'samples': 2114496, 'steps': 11012, 'loss/train': 1.6776947975158691} +11/06/2021 22:46:30 - INFO - __main__ - Step 11014: {'lr': 0.0004954385810375415, 'samples': 2114688, 'steps': 11013, 'loss/train': 0.4628012776374817} +11/06/2021 22:46:31 - INFO - __main__ - Step 11015: {'lr': 0.0004954375718849308, 'samples': 2114880, 'steps': 11014, 'loss/train': 1.808875560760498} +11/06/2021 22:46:31 - INFO - __main__ - Step 11016: {'lr': 0.0004954365626217299, 'samples': 2115072, 'steps': 11015, 'loss/train': 1.8625273704528809} +11/06/2021 22:46:32 - INFO - __main__ - Step 11017: {'lr': 0.0004954355532479391, 'samples': 2115264, 'steps': 11016, 'loss/train': 1.388060450553894} +11/06/2021 22:46:32 - INFO - __main__ - Step 11018: {'lr': 0.0004954345437635587, 'samples': 2115456, 'steps': 11017, 'loss/train': 1.43634033203125} +11/06/2021 22:46:32 - INFO - __main__ - Step 11019: {'lr': 0.0004954335341685893, 'samples': 2115648, 'steps': 11018, 'loss/train': 1.6223043203353882} +11/06/2021 22:46:33 - INFO - __main__ - Step 11020: {'lr': 0.0004954325244630315, 'samples': 2115840, 'steps': 11019, 'loss/train': 1.9205574989318848} +11/06/2021 22:46:34 - INFO - __main__ - Step 11021: {'lr': 0.0004954315146468854, 'samples': 2116032, 'steps': 11020, 'loss/train': 2.2265076637268066} +11/06/2021 22:46:34 - INFO - __main__ - Step 11022: {'lr': 0.0004954305047201517, 'samples': 2116224, 'steps': 11021, 'loss/train': 1.7414882183074951} +11/06/2021 22:46:34 - INFO - __main__ - Step 11023: {'lr': 0.0004954294946828308, 'samples': 2116416, 'steps': 11022, 'loss/train': 2.187809944152832} +11/06/2021 22:46:35 - INFO - __main__ - Step 11024: {'lr': 0.0004954284845349232, 'samples': 2116608, 'steps': 11023, 'loss/train': 1.778928279876709} +11/06/2021 22:46:35 - INFO - __main__ - Step 11025: {'lr': 0.0004954274742764292, 'samples': 2116800, 'steps': 11024, 'loss/train': 1.018846869468689} +11/06/2021 22:46:36 - INFO - __main__ - Step 11026: {'lr': 0.0004954264639073495, 'samples': 2116992, 'steps': 11025, 'loss/train': 4.848390579223633} +11/06/2021 22:46:37 - INFO - __main__ - Step 11027: {'lr': 0.0004954254534276843, 'samples': 2117184, 'steps': 11026, 'loss/train': 1.92079496383667} +11/06/2021 22:46:37 - INFO - __main__ - Step 11028: {'lr': 0.0004954244428374343, 'samples': 2117376, 'steps': 11027, 'loss/train': 1.617121934890747} +11/06/2021 22:46:37 - INFO - __main__ - Step 11029: {'lr': 0.0004954234321365998, 'samples': 2117568, 'steps': 11028, 'loss/train': 2.104278087615967} +11/06/2021 22:46:38 - INFO - __main__ - Step 11030: {'lr': 0.0004954224213251813, 'samples': 2117760, 'steps': 11029, 'loss/train': 1.8662179708480835} +11/06/2021 22:46:39 - INFO - __main__ - Step 11031: {'lr': 0.0004954214104031791, 'samples': 2117952, 'steps': 11030, 'loss/train': 1.559154748916626} +11/06/2021 22:46:39 - INFO - __main__ - Step 11032: {'lr': 0.0004954203993705939, 'samples': 2118144, 'steps': 11031, 'loss/train': 1.7694008350372314} +11/06/2021 22:46:39 - INFO - __main__ - Step 11033: {'lr': 0.0004954193882274261, 'samples': 2118336, 'steps': 11032, 'loss/train': 1.8850313425064087} +11/06/2021 22:46:40 - INFO - __main__ - Step 11034: {'lr': 0.000495418376973676, 'samples': 2118528, 'steps': 11033, 'loss/train': 1.6931498050689697} +11/06/2021 22:46:40 - INFO - __main__ - Step 11035: {'lr': 0.0004954173656093443, 'samples': 2118720, 'steps': 11034, 'loss/train': 1.525468111038208} +11/06/2021 22:46:41 - INFO - __main__ - Step 11036: {'lr': 0.0004954163541344312, 'samples': 2118912, 'steps': 11035, 'loss/train': 1.5203142166137695} +11/06/2021 22:46:41 - INFO - __main__ - Step 11037: {'lr': 0.0004954153425489374, 'samples': 2119104, 'steps': 11036, 'loss/train': 1.7933595180511475} +11/06/2021 22:46:42 - INFO - __main__ - Step 11038: {'lr': 0.0004954143308528631, 'samples': 2119296, 'steps': 11037, 'loss/train': 1.0918980836868286} +11/06/2021 22:46:42 - INFO - __main__ - Step 11039: {'lr': 0.000495413319046209, 'samples': 2119488, 'steps': 11038, 'loss/train': 2.03767728805542} +11/06/2021 22:46:42 - INFO - __main__ - Step 11040: {'lr': 0.0004954123071289754, 'samples': 2119680, 'steps': 11039, 'loss/train': 1.9475619792938232} +11/06/2021 22:46:43 - INFO - __main__ - Step 11041: {'lr': 0.0004954112951011628, 'samples': 2119872, 'steps': 11040, 'loss/train': 1.5636467933654785} +11/06/2021 22:46:44 - INFO - __main__ - Step 11042: {'lr': 0.0004954102829627717, 'samples': 2120064, 'steps': 11041, 'loss/train': 2.0013155937194824} +11/06/2021 22:46:44 - INFO - __main__ - Step 11043: {'lr': 0.0004954092707138024, 'samples': 2120256, 'steps': 11042, 'loss/train': 1.427595853805542} +11/06/2021 22:46:44 - INFO - __main__ - Step 11044: {'lr': 0.0004954082583542557, 'samples': 2120448, 'steps': 11043, 'loss/train': 1.2948354482650757} +11/06/2021 22:46:45 - INFO - __main__ - Step 11045: {'lr': 0.0004954072458841315, 'samples': 2120640, 'steps': 11044, 'loss/train': 1.7006868124008179} +11/06/2021 22:46:46 - INFO - __main__ - Step 11046: {'lr': 0.0004954062333034308, 'samples': 2120832, 'steps': 11045, 'loss/train': 1.9174220561981201} +11/06/2021 22:46:46 - INFO - __main__ - Step 11047: {'lr': 0.0004954052206121538, 'samples': 2121024, 'steps': 11046, 'loss/train': 2.2105274200439453} +11/06/2021 22:46:47 - INFO - __main__ - Step 11048: {'lr': 0.000495404207810301, 'samples': 2121216, 'steps': 11047, 'loss/train': 1.7449531555175781} +11/06/2021 22:46:47 - INFO - __main__ - Step 11049: {'lr': 0.0004954031948978729, 'samples': 2121408, 'steps': 11048, 'loss/train': 1.3999689817428589} +11/06/2021 22:46:47 - INFO - __main__ - Step 11050: {'lr': 0.0004954021818748698, 'samples': 2121600, 'steps': 11049, 'loss/train': 2.2191524505615234} +11/06/2021 22:46:48 - INFO - __main__ - Step 11051: {'lr': 0.0004954011687412923, 'samples': 2121792, 'steps': 11050, 'loss/train': 1.5955177545547485} +11/06/2021 22:46:49 - INFO - __main__ - Step 11052: {'lr': 0.0004954001554971409, 'samples': 2121984, 'steps': 11051, 'loss/train': 1.4700356721878052} +11/06/2021 22:46:49 - INFO - __main__ - Step 11053: {'lr': 0.0004953991421424159, 'samples': 2122176, 'steps': 11052, 'loss/train': 1.7988489866256714} +11/06/2021 22:46:49 - INFO - __main__ - Step 11054: {'lr': 0.0004953981286771178, 'samples': 2122368, 'steps': 11053, 'loss/train': 0.8524397015571594} +11/06/2021 22:46:50 - INFO - __main__ - Step 11055: {'lr': 0.0004953971151012471, 'samples': 2122560, 'steps': 11054, 'loss/train': 1.956466794013977} +11/06/2021 22:46:51 - INFO - __main__ - Step 11056: {'lr': 0.0004953961014148043, 'samples': 2122752, 'steps': 11055, 'loss/train': 1.7897028923034668} +11/06/2021 22:46:51 - INFO - __main__ - Step 11057: {'lr': 0.0004953950876177897, 'samples': 2122944, 'steps': 11056, 'loss/train': 2.5609962940216064} +11/06/2021 22:46:51 - INFO - __main__ - Step 11058: {'lr': 0.000495394073710204, 'samples': 2123136, 'steps': 11057, 'loss/train': 1.6628973484039307} +11/06/2021 22:46:52 - INFO - __main__ - Step 11059: {'lr': 0.0004953930596920474, 'samples': 2123328, 'steps': 11058, 'loss/train': 0.9463735222816467} +11/06/2021 22:46:52 - INFO - __main__ - Step 11060: {'lr': 0.0004953920455633206, 'samples': 2123520, 'steps': 11059, 'loss/train': 1.7199558019638062} +11/06/2021 22:46:53 - INFO - __main__ - Step 11061: {'lr': 0.0004953910313240239, 'samples': 2123712, 'steps': 11060, 'loss/train': 2.0685226917266846} +11/06/2021 22:46:53 - INFO - __main__ - Step 11062: {'lr': 0.0004953900169741577, 'samples': 2123904, 'steps': 11061, 'loss/train': 1.852885127067566} +11/06/2021 22:46:54 - INFO - __main__ - Step 11063: {'lr': 0.0004953890025137226, 'samples': 2124096, 'steps': 11062, 'loss/train': 1.0211209058761597} +11/06/2021 22:46:54 - INFO - __main__ - Step 11064: {'lr': 0.000495387987942719, 'samples': 2124288, 'steps': 11063, 'loss/train': 1.8901044130325317} +11/06/2021 22:46:55 - INFO - __main__ - Step 11065: {'lr': 0.0004953869732611474, 'samples': 2124480, 'steps': 11064, 'loss/train': 1.3837004899978638} +11/06/2021 22:46:56 - INFO - __main__ - Step 11066: {'lr': 0.0004953859584690081, 'samples': 2124672, 'steps': 11065, 'loss/train': 1.3166968822479248} +11/06/2021 22:46:56 - INFO - __main__ - Step 11067: {'lr': 0.0004953849435663018, 'samples': 2124864, 'steps': 11066, 'loss/train': 1.1097654104232788} +11/06/2021 22:46:56 - INFO - __main__ - Step 11068: {'lr': 0.0004953839285530287, 'samples': 2125056, 'steps': 11067, 'loss/train': 1.8698753118515015} +11/06/2021 22:46:57 - INFO - __main__ - Step 11069: {'lr': 0.0004953829134291895, 'samples': 2125248, 'steps': 11068, 'loss/train': 2.0392954349517822} +11/06/2021 22:46:57 - INFO - __main__ - Step 11070: {'lr': 0.0004953818981947845, 'samples': 2125440, 'steps': 11069, 'loss/train': 1.821742057800293} +11/06/2021 22:46:58 - INFO - __main__ - Step 11071: {'lr': 0.0004953808828498142, 'samples': 2125632, 'steps': 11070, 'loss/train': 1.4613873958587646} +11/06/2021 22:46:58 - INFO - __main__ - Step 11072: {'lr': 0.0004953798673942791, 'samples': 2125824, 'steps': 11071, 'loss/train': 1.947845220565796} +11/06/2021 22:46:59 - INFO - __main__ - Step 11073: {'lr': 0.0004953788518281796, 'samples': 2126016, 'steps': 11072, 'loss/train': 2.3288230895996094} +11/06/2021 22:46:59 - INFO - __main__ - Step 11074: {'lr': 0.0004953778361515163, 'samples': 2126208, 'steps': 11073, 'loss/train': 1.7177420854568481} +11/06/2021 22:46:59 - INFO - __main__ - Step 11075: {'lr': 0.0004953768203642893, 'samples': 2126400, 'steps': 11074, 'loss/train': 1.5442180633544922} +11/06/2021 22:47:00 - INFO - __main__ - Step 11076: {'lr': 0.0004953758044664994, 'samples': 2126592, 'steps': 11075, 'loss/train': 2.2615766525268555} +11/06/2021 22:47:01 - INFO - __main__ - Step 11077: {'lr': 0.0004953747884581469, 'samples': 2126784, 'steps': 11076, 'loss/train': 2.156431198120117} +11/06/2021 22:47:01 - INFO - __main__ - Step 11078: {'lr': 0.0004953737723392324, 'samples': 2126976, 'steps': 11077, 'loss/train': 2.2842390537261963} +11/06/2021 22:47:01 - INFO - __main__ - Step 11079: {'lr': 0.0004953727561097562, 'samples': 2127168, 'steps': 11078, 'loss/train': 1.461220383644104} +11/06/2021 22:47:02 - INFO - __main__ - Step 11080: {'lr': 0.0004953717397697189, 'samples': 2127360, 'steps': 11079, 'loss/train': 1.6877996921539307} +11/06/2021 22:47:02 - INFO - __main__ - Step 11081: {'lr': 0.0004953707233191207, 'samples': 2127552, 'steps': 11080, 'loss/train': 1.1885510683059692} +11/06/2021 22:47:03 - INFO - __main__ - Step 11082: {'lr': 0.0004953697067579624, 'samples': 2127744, 'steps': 11081, 'loss/train': 1.5058166980743408} +11/06/2021 22:47:03 - INFO - __main__ - Step 11083: {'lr': 0.0004953686900862442, 'samples': 2127936, 'steps': 11082, 'loss/train': 1.6675527095794678} +11/06/2021 22:47:04 - INFO - __main__ - Step 11084: {'lr': 0.0004953676733039668, 'samples': 2128128, 'steps': 11083, 'loss/train': 1.9385559558868408} +11/06/2021 22:47:04 - INFO - __main__ - Step 11085: {'lr': 0.0004953666564111303, 'samples': 2128320, 'steps': 11084, 'loss/train': 1.6214722394943237} +11/06/2021 22:47:05 - INFO - __main__ - Step 11086: {'lr': 0.0004953656394077355, 'samples': 2128512, 'steps': 11085, 'loss/train': 1.1860450506210327} +11/06/2021 22:47:06 - INFO - __main__ - Step 11087: {'lr': 0.0004953646222937828, 'samples': 2128704, 'steps': 11086, 'loss/train': 1.8663421869277954} +11/06/2021 22:47:06 - INFO - __main__ - Step 11088: {'lr': 0.0004953636050692724, 'samples': 2128896, 'steps': 11087, 'loss/train': 1.5686103105545044} +11/06/2021 22:47:06 - INFO - __main__ - Step 11089: {'lr': 0.0004953625877342051, 'samples': 2129088, 'steps': 11088, 'loss/train': 1.8276753425598145} +11/06/2021 22:47:07 - INFO - __main__ - Step 11090: {'lr': 0.0004953615702885812, 'samples': 2129280, 'steps': 11089, 'loss/train': 1.5646089315414429} +11/06/2021 22:47:07 - INFO - __main__ - Step 11091: {'lr': 0.0004953605527324011, 'samples': 2129472, 'steps': 11090, 'loss/train': 1.7502714395523071} +11/06/2021 22:47:08 - INFO - __main__ - Step 11092: {'lr': 0.0004953595350656653, 'samples': 2129664, 'steps': 11091, 'loss/train': 1.3079643249511719} +11/06/2021 22:47:08 - INFO - __main__ - Step 11093: {'lr': 0.0004953585172883743, 'samples': 2129856, 'steps': 11092, 'loss/train': 1.8320194482803345} +11/06/2021 22:47:09 - INFO - __main__ - Step 11094: {'lr': 0.0004953574994005286, 'samples': 2130048, 'steps': 11093, 'loss/train': 1.7098597288131714} +11/06/2021 22:47:09 - INFO - __main__ - Step 11095: {'lr': 0.0004953564814021285, 'samples': 2130240, 'steps': 11094, 'loss/train': 1.9974864721298218} +11/06/2021 22:47:09 - INFO - __main__ - Step 11096: {'lr': 0.0004953554632931746, 'samples': 2130432, 'steps': 11095, 'loss/train': 1.8548189401626587} +11/06/2021 22:47:10 - INFO - __main__ - Step 11097: {'lr': 0.0004953544450736674, 'samples': 2130624, 'steps': 11096, 'loss/train': 1.8645987510681152} +11/06/2021 22:47:11 - INFO - __main__ - Step 11098: {'lr': 0.0004953534267436072, 'samples': 2130816, 'steps': 11097, 'loss/train': 2.160127878189087} +11/06/2021 22:47:11 - INFO - __main__ - Step 11099: {'lr': 0.0004953524083029945, 'samples': 2131008, 'steps': 11098, 'loss/train': 2.143897533416748} +11/06/2021 22:47:11 - INFO - __main__ - Step 11100: {'lr': 0.0004953513897518298, 'samples': 2131200, 'steps': 11099, 'loss/train': 1.7265970706939697} +11/06/2021 22:47:12 - INFO - __main__ - Step 11101: {'lr': 0.0004953503710901136, 'samples': 2131392, 'steps': 11100, 'loss/train': 1.6248968839645386} +11/06/2021 22:47:13 - INFO - __main__ - Step 11102: {'lr': 0.0004953493523178463, 'samples': 2131584, 'steps': 11101, 'loss/train': 1.7727121114730835} +11/06/2021 22:47:13 - INFO - __main__ - Step 11103: {'lr': 0.0004953483334350283, 'samples': 2131776, 'steps': 11102, 'loss/train': 1.5690078735351562} +11/06/2021 22:47:13 - INFO - __main__ - Step 11104: {'lr': 0.0004953473144416602, 'samples': 2131968, 'steps': 11103, 'loss/train': 1.7810686826705933} +11/06/2021 22:47:14 - INFO - __main__ - Step 11105: {'lr': 0.0004953462953377424, 'samples': 2132160, 'steps': 11104, 'loss/train': 1.8869816064834595} +11/06/2021 22:47:14 - INFO - __main__ - Step 11106: {'lr': 0.0004953452761232753, 'samples': 2132352, 'steps': 11105, 'loss/train': 2.1093719005584717} +11/06/2021 22:47:15 - INFO - __main__ - Step 11107: {'lr': 0.0004953442567982593, 'samples': 2132544, 'steps': 11106, 'loss/train': 1.606833815574646} +11/06/2021 22:47:15 - INFO - __main__ - Step 11108: {'lr': 0.0004953432373626951, 'samples': 2132736, 'steps': 11107, 'loss/train': 1.9414929151535034} +11/06/2021 22:47:16 - INFO - __main__ - Step 11109: {'lr': 0.0004953422178165831, 'samples': 2132928, 'steps': 11108, 'loss/train': 1.8882904052734375} +11/06/2021 22:47:16 - INFO - __main__ - Step 11110: {'lr': 0.0004953411981599235, 'samples': 2133120, 'steps': 11109, 'loss/train': 1.7762526273727417} +11/06/2021 22:47:17 - INFO - __main__ - Step 11111: {'lr': 0.0004953401783927171, 'samples': 2133312, 'steps': 11110, 'loss/train': 1.9979164600372314} +11/06/2021 22:47:17 - INFO - __main__ - Step 11112: {'lr': 0.000495339158514964, 'samples': 2133504, 'steps': 11111, 'loss/train': 1.818439245223999} +11/06/2021 22:47:18 - INFO - __main__ - Step 11113: {'lr': 0.0004953381385266651, 'samples': 2133696, 'steps': 11112, 'loss/train': 1.8462194204330444} +11/06/2021 22:47:18 - INFO - __main__ - Step 11114: {'lr': 0.0004953371184278205, 'samples': 2133888, 'steps': 11113, 'loss/train': 1.7984886169433594} +11/06/2021 22:47:19 - INFO - __main__ - Step 11115: {'lr': 0.0004953360982184308, 'samples': 2134080, 'steps': 11114, 'loss/train': 2.2713496685028076} +11/06/2021 22:47:19 - INFO - __main__ - Step 11116: {'lr': 0.0004953350778984963, 'samples': 2134272, 'steps': 11115, 'loss/train': 1.8427363634109497} +11/06/2021 22:47:19 - INFO - __main__ - Step 11117: {'lr': 0.0004953340574680177, 'samples': 2134464, 'steps': 11116, 'loss/train': 1.2288328409194946} +11/06/2021 22:47:20 - INFO - __main__ - Step 11118: {'lr': 0.0004953330369269955, 'samples': 2134656, 'steps': 11117, 'loss/train': 1.9006093740463257} +11/06/2021 22:47:21 - INFO - __main__ - Step 11119: {'lr': 0.0004953320162754298, 'samples': 2134848, 'steps': 11118, 'loss/train': 1.618245244026184} +11/06/2021 22:47:21 - INFO - __main__ - Step 11120: {'lr': 0.0004953309955133214, 'samples': 2135040, 'steps': 11119, 'loss/train': 1.8152966499328613} +11/06/2021 22:47:22 - INFO - __main__ - Step 11121: {'lr': 0.0004953299746406707, 'samples': 2135232, 'steps': 11120, 'loss/train': 1.3982417583465576} +11/06/2021 22:47:22 - INFO - __main__ - Step 11122: {'lr': 0.000495328953657478, 'samples': 2135424, 'steps': 11121, 'loss/train': 1.8065004348754883} +11/06/2021 22:47:23 - INFO - __main__ - Step 11123: {'lr': 0.0004953279325637438, 'samples': 2135616, 'steps': 11122, 'loss/train': 1.807936191558838} +11/06/2021 22:47:23 - INFO - __main__ - Step 11124: {'lr': 0.0004953269113594687, 'samples': 2135808, 'steps': 11123, 'loss/train': 1.684847116470337} +11/06/2021 22:47:24 - INFO - __main__ - Step 11125: {'lr': 0.0004953258900446531, 'samples': 2136000, 'steps': 11124, 'loss/train': 1.3972996473312378} +11/06/2021 22:47:24 - INFO - __main__ - Step 11126: {'lr': 0.0004953248686192975, 'samples': 2136192, 'steps': 11125, 'loss/train': 1.6219148635864258} +11/06/2021 22:47:24 - INFO - __main__ - Step 11127: {'lr': 0.0004953238470834022, 'samples': 2136384, 'steps': 11126, 'loss/train': 0.5669246912002563} +11/06/2021 22:47:25 - INFO - __main__ - Step 11128: {'lr': 0.0004953228254369677, 'samples': 2136576, 'steps': 11127, 'loss/train': 1.5386314392089844} +11/06/2021 22:47:26 - INFO - __main__ - Step 11129: {'lr': 0.0004953218036799946, 'samples': 2136768, 'steps': 11128, 'loss/train': 1.7558674812316895} +11/06/2021 22:47:26 - INFO - __main__ - Step 11130: {'lr': 0.0004953207818124833, 'samples': 2136960, 'steps': 11129, 'loss/train': 1.2307705879211426} +11/06/2021 22:47:26 - INFO - __main__ - Step 11131: {'lr': 0.0004953197598344342, 'samples': 2137152, 'steps': 11130, 'loss/train': 2.116920232772827} +11/06/2021 22:47:27 - INFO - __main__ - Step 11132: {'lr': 0.0004953187377458478, 'samples': 2137344, 'steps': 11131, 'loss/train': 2.0362181663513184} +11/06/2021 22:47:28 - INFO - __main__ - Step 11133: {'lr': 0.0004953177155467246, 'samples': 2137536, 'steps': 11132, 'loss/train': 1.7032719850540161} +11/06/2021 22:47:28 - INFO - __main__ - Step 11134: {'lr': 0.0004953166932370651, 'samples': 2137728, 'steps': 11133, 'loss/train': 1.8138678073883057} +11/06/2021 22:47:28 - INFO - __main__ - Step 11135: {'lr': 0.0004953156708168695, 'samples': 2137920, 'steps': 11134, 'loss/train': 1.8151832818984985} +11/06/2021 22:47:29 - INFO - __main__ - Step 11136: {'lr': 0.0004953146482861385, 'samples': 2138112, 'steps': 11135, 'loss/train': 1.7565672397613525} +11/06/2021 22:47:29 - INFO - __main__ - Step 11137: {'lr': 0.0004953136256448725, 'samples': 2138304, 'steps': 11136, 'loss/train': 1.687888741493225} +11/06/2021 22:47:29 - INFO - __main__ - Step 11138: {'lr': 0.0004953126028930721, 'samples': 2138496, 'steps': 11137, 'loss/train': 1.2880886793136597} +11/06/2021 22:47:31 - INFO - __main__ - Step 11139: {'lr': 0.0004953115800307375, 'samples': 2138688, 'steps': 11138, 'loss/train': 1.8301455974578857} +11/06/2021 22:47:31 - INFO - __main__ - Step 11140: {'lr': 0.0004953105570578693, 'samples': 2138880, 'steps': 11139, 'loss/train': 1.5267943143844604} +11/06/2021 22:47:31 - INFO - __main__ - Step 11141: {'lr': 0.000495309533974468, 'samples': 2139072, 'steps': 11140, 'loss/train': 1.7597218751907349} +11/06/2021 22:47:32 - INFO - __main__ - Step 11142: {'lr': 0.0004953085107805339, 'samples': 2139264, 'steps': 11141, 'loss/train': 0.6988817453384399} +11/06/2021 22:47:32 - INFO - __main__ - Step 11143: {'lr': 0.0004953074874760677, 'samples': 2139456, 'steps': 11142, 'loss/train': 1.4152743816375732} +11/06/2021 22:47:33 - INFO - __main__ - Step 11144: {'lr': 0.0004953064640610697, 'samples': 2139648, 'steps': 11143, 'loss/train': 1.5432703495025635} +11/06/2021 22:47:33 - INFO - __main__ - Step 11145: {'lr': 0.0004953054405355404, 'samples': 2139840, 'steps': 11144, 'loss/train': 2.103456735610962} +11/06/2021 22:47:34 - INFO - __main__ - Step 11146: {'lr': 0.0004953044168994802, 'samples': 2140032, 'steps': 11145, 'loss/train': 1.8357820510864258} +11/06/2021 22:47:34 - INFO - __main__ - Step 11147: {'lr': 0.0004953033931528897, 'samples': 2140224, 'steps': 11146, 'loss/train': 1.426553726196289} +11/06/2021 22:47:34 - INFO - __main__ - Step 11148: {'lr': 0.0004953023692957691, 'samples': 2140416, 'steps': 11147, 'loss/train': 0.9832262992858887} +11/06/2021 22:47:35 - INFO - __main__ - Step 11149: {'lr': 0.0004953013453281193, 'samples': 2140608, 'steps': 11148, 'loss/train': 2.1371872425079346} +11/06/2021 22:47:36 - INFO - __main__ - Step 11150: {'lr': 0.0004953003212499403, 'samples': 2140800, 'steps': 11149, 'loss/train': 2.0583853721618652} +11/06/2021 22:47:36 - INFO - __main__ - Step 11151: {'lr': 0.0004952992970612328, 'samples': 2140992, 'steps': 11150, 'loss/train': 1.6691161394119263} +11/06/2021 22:47:36 - INFO - __main__ - Step 11152: {'lr': 0.0004952982727619973, 'samples': 2141184, 'steps': 11151, 'loss/train': 1.672674298286438} +11/06/2021 22:47:37 - INFO - __main__ - Step 11153: {'lr': 0.000495297248352234, 'samples': 2141376, 'steps': 11152, 'loss/train': 0.8161516785621643} +11/06/2021 22:47:38 - INFO - __main__ - Step 11154: {'lr': 0.0004952962238319436, 'samples': 2141568, 'steps': 11153, 'loss/train': 1.0644028186798096} +11/06/2021 22:47:38 - INFO - __main__ - Step 11155: {'lr': 0.0004952951992011266, 'samples': 2141760, 'steps': 11154, 'loss/train': 1.5536161661148071} +11/06/2021 22:47:39 - INFO - __main__ - Step 11156: {'lr': 0.0004952941744597834, 'samples': 2141952, 'steps': 11155, 'loss/train': 1.6991686820983887} +11/06/2021 22:47:39 - INFO - __main__ - Step 11157: {'lr': 0.0004952931496079143, 'samples': 2142144, 'steps': 11156, 'loss/train': 1.9701721668243408} +11/06/2021 22:47:39 - INFO - __main__ - Step 11158: {'lr': 0.00049529212464552, 'samples': 2142336, 'steps': 11157, 'loss/train': 1.5034873485565186} +11/06/2021 22:47:40 - INFO - __main__ - Step 11159: {'lr': 0.0004952910995726008, 'samples': 2142528, 'steps': 11158, 'loss/train': 1.8932499885559082} +11/06/2021 22:47:41 - INFO - __main__ - Step 11160: {'lr': 0.0004952900743891573, 'samples': 2142720, 'steps': 11159, 'loss/train': 1.5492379665374756} +11/06/2021 22:47:41 - INFO - __main__ - Step 11161: {'lr': 0.0004952890490951898, 'samples': 2142912, 'steps': 11160, 'loss/train': 1.9090741872787476} +11/06/2021 22:47:41 - INFO - __main__ - Step 11162: {'lr': 0.0004952880236906988, 'samples': 2143104, 'steps': 11161, 'loss/train': 1.2465680837631226} +11/06/2021 22:47:42 - INFO - __main__ - Step 11163: {'lr': 0.0004952869981756848, 'samples': 2143296, 'steps': 11162, 'loss/train': 1.629738450050354} +11/06/2021 22:47:42 - INFO - __main__ - Step 11164: {'lr': 0.0004952859725501484, 'samples': 2143488, 'steps': 11163, 'loss/train': 1.934152364730835} +11/06/2021 22:47:43 - INFO - __main__ - Step 11165: {'lr': 0.0004952849468140898, 'samples': 2143680, 'steps': 11164, 'loss/train': 1.5853830575942993} +11/06/2021 22:47:43 - INFO - __main__ - Step 11166: {'lr': 0.0004952839209675096, 'samples': 2143872, 'steps': 11165, 'loss/train': 1.383769154548645} +11/06/2021 22:47:44 - INFO - __main__ - Step 11167: {'lr': 0.0004952828950104083, 'samples': 2144064, 'steps': 11166, 'loss/train': 1.3340117931365967} +11/06/2021 22:47:44 - INFO - __main__ - Step 11168: {'lr': 0.0004952818689427863, 'samples': 2144256, 'steps': 11167, 'loss/train': 1.787481665611267} +11/06/2021 22:47:44 - INFO - __main__ - Step 11169: {'lr': 0.0004952808427646441, 'samples': 2144448, 'steps': 11168, 'loss/train': 1.6143748760223389} +11/06/2021 22:47:45 - INFO - __main__ - Step 11170: {'lr': 0.000495279816475982, 'samples': 2144640, 'steps': 11169, 'loss/train': 1.741720199584961} +11/06/2021 22:47:46 - INFO - __main__ - Step 11171: {'lr': 0.0004952787900768008, 'samples': 2144832, 'steps': 11170, 'loss/train': 1.8251887559890747} +11/06/2021 22:47:46 - INFO - __main__ - Step 11172: {'lr': 0.0004952777635671006, 'samples': 2145024, 'steps': 11171, 'loss/train': 2.326918125152588} +11/06/2021 22:47:46 - INFO - __main__ - Step 11173: {'lr': 0.0004952767369468821, 'samples': 2145216, 'steps': 11172, 'loss/train': 1.6599018573760986} +11/06/2021 22:47:47 - INFO - __main__ - Step 11174: {'lr': 0.0004952757102161457, 'samples': 2145408, 'steps': 11173, 'loss/train': 1.3439342975616455} +11/06/2021 22:47:48 - INFO - __main__ - Step 11175: {'lr': 0.0004952746833748918, 'samples': 2145600, 'steps': 11174, 'loss/train': 1.5779838562011719} +11/06/2021 22:47:48 - INFO - __main__ - Step 11176: {'lr': 0.0004952736564231209, 'samples': 2145792, 'steps': 11175, 'loss/train': 1.711625099182129} +11/06/2021 22:47:49 - INFO - __main__ - Step 11177: {'lr': 0.0004952726293608335, 'samples': 2145984, 'steps': 11176, 'loss/train': 1.7261056900024414} +11/06/2021 22:47:49 - INFO - __main__ - Step 11178: {'lr': 0.0004952716021880301, 'samples': 2146176, 'steps': 11177, 'loss/train': 2.207341194152832} +11/06/2021 22:47:49 - INFO - __main__ - Step 11179: {'lr': 0.0004952705749047111, 'samples': 2146368, 'steps': 11178, 'loss/train': 1.6642247438430786} +11/06/2021 22:47:50 - INFO - __main__ - Step 11180: {'lr': 0.0004952695475108768, 'samples': 2146560, 'steps': 11179, 'loss/train': 1.309320092201233} +11/06/2021 22:47:51 - INFO - __main__ - Step 11181: {'lr': 0.000495268520006528, 'samples': 2146752, 'steps': 11180, 'loss/train': 1.2601646184921265} +11/06/2021 22:47:51 - INFO - __main__ - Step 11182: {'lr': 0.000495267492391665, 'samples': 2146944, 'steps': 11181, 'loss/train': 1.730563759803772} +11/06/2021 22:47:52 - INFO - __main__ - Step 11183: {'lr': 0.0004952664646662882, 'samples': 2147136, 'steps': 11182, 'loss/train': 1.8496640920639038} +11/06/2021 22:47:52 - INFO - __main__ - Step 11184: {'lr': 0.000495265436830398, 'samples': 2147328, 'steps': 11183, 'loss/train': 1.282710075378418} +11/06/2021 22:47:52 - INFO - __main__ - Step 11185: {'lr': 0.0004952644088839951, 'samples': 2147520, 'steps': 11184, 'loss/train': 0.9519102573394775} +11/06/2021 22:47:54 - INFO - __main__ - Step 11186: {'lr': 0.0004952633808270797, 'samples': 2147712, 'steps': 11185, 'loss/train': 2.1716973781585693} +11/06/2021 22:47:54 - INFO - __main__ - Step 11187: {'lr': 0.0004952623526596526, 'samples': 2147904, 'steps': 11186, 'loss/train': 1.5648038387298584} +11/06/2021 22:47:54 - INFO - __main__ - Step 11188: {'lr': 0.000495261324381714, 'samples': 2148096, 'steps': 11187, 'loss/train': 1.8554600477218628} +11/06/2021 22:47:55 - INFO - __main__ - Step 11189: {'lr': 0.0004952602959932644, 'samples': 2148288, 'steps': 11188, 'loss/train': 0.2998165488243103} +11/06/2021 22:47:55 - INFO - __main__ - Step 11190: {'lr': 0.0004952592674943043, 'samples': 2148480, 'steps': 11189, 'loss/train': 1.513887882232666} +11/06/2021 22:47:56 - INFO - __main__ - Step 11191: {'lr': 0.0004952582388848343, 'samples': 2148672, 'steps': 11190, 'loss/train': 1.61158287525177} +11/06/2021 22:47:56 - INFO - __main__ - Step 11192: {'lr': 0.0004952572101648545, 'samples': 2148864, 'steps': 11191, 'loss/train': 1.4567087888717651} +11/06/2021 22:47:57 - INFO - __main__ - Step 11193: {'lr': 0.0004952561813343657, 'samples': 2149056, 'steps': 11192, 'loss/train': 1.598156452178955} +11/06/2021 22:47:57 - INFO - __main__ - Step 11194: {'lr': 0.0004952551523933682, 'samples': 2149248, 'steps': 11193, 'loss/train': 2.243593692779541} +11/06/2021 22:47:58 - INFO - __main__ - Step 11195: {'lr': 0.0004952541233418626, 'samples': 2149440, 'steps': 11194, 'loss/train': 1.6861417293548584} +11/06/2021 22:47:59 - INFO - __main__ - Step 11196: {'lr': 0.0004952530941798492, 'samples': 2149632, 'steps': 11195, 'loss/train': 1.3837568759918213} +11/06/2021 22:47:59 - INFO - __main__ - Step 11197: {'lr': 0.0004952520649073286, 'samples': 2149824, 'steps': 11196, 'loss/train': 1.8483117818832397} +11/06/2021 22:47:59 - INFO - __main__ - Step 11198: {'lr': 0.0004952510355243012, 'samples': 2150016, 'steps': 11197, 'loss/train': 1.94416081905365} +11/06/2021 22:48:00 - INFO - __main__ - Step 11199: {'lr': 0.0004952500060307674, 'samples': 2150208, 'steps': 11198, 'loss/train': 1.9236924648284912} +11/06/2021 22:48:00 - INFO - __main__ - Step 11200: {'lr': 0.0004952489764267278, 'samples': 2150400, 'steps': 11199, 'loss/train': 2.271418333053589} +11/06/2021 22:48:01 - INFO - __main__ - Step 11201: {'lr': 0.0004952479467121827, 'samples': 2150592, 'steps': 11200, 'loss/train': 1.6901092529296875} +11/06/2021 22:48:01 - INFO - __main__ - Step 11202: {'lr': 0.0004952469168871327, 'samples': 2150784, 'steps': 11201, 'loss/train': 1.9666694402694702} +11/06/2021 22:48:02 - INFO - __main__ - Step 11203: {'lr': 0.0004952458869515782, 'samples': 2150976, 'steps': 11202, 'loss/train': 1.9771145582199097} +11/06/2021 22:48:02 - INFO - __main__ - Step 11204: {'lr': 0.0004952448569055198, 'samples': 2151168, 'steps': 11203, 'loss/train': 1.4397884607315063} +11/06/2021 22:48:02 - INFO - __main__ - Step 11205: {'lr': 0.0004952438267489578, 'samples': 2151360, 'steps': 11204, 'loss/train': 1.73050856590271} +11/06/2021 22:48:03 - INFO - __main__ - Step 11206: {'lr': 0.0004952427964818927, 'samples': 2151552, 'steps': 11205, 'loss/train': 1.7064839601516724} +11/06/2021 22:48:04 - INFO - __main__ - Step 11207: {'lr': 0.0004952417661043249, 'samples': 2151744, 'steps': 11206, 'loss/train': 1.7774326801300049} +11/06/2021 22:48:04 - INFO - __main__ - Step 11208: {'lr': 0.0004952407356162551, 'samples': 2151936, 'steps': 11207, 'loss/train': 1.5006650686264038} +11/06/2021 22:48:04 - INFO - __main__ - Step 11209: {'lr': 0.0004952397050176835, 'samples': 2152128, 'steps': 11208, 'loss/train': 1.9831914901733398} +11/06/2021 22:48:05 - INFO - __main__ - Step 11210: {'lr': 0.0004952386743086107, 'samples': 2152320, 'steps': 11209, 'loss/train': 1.5023480653762817} +11/06/2021 22:48:05 - INFO - __main__ - Step 11211: {'lr': 0.0004952376434890372, 'samples': 2152512, 'steps': 11210, 'loss/train': 1.4154393672943115} +11/06/2021 22:48:06 - INFO - __main__ - Step 11212: {'lr': 0.0004952366125589633, 'samples': 2152704, 'steps': 11211, 'loss/train': 1.498394250869751} +11/06/2021 22:48:07 - INFO - __main__ - Step 11213: {'lr': 0.0004952355815183897, 'samples': 2152896, 'steps': 11212, 'loss/train': 1.85457444190979} +11/06/2021 22:48:07 - INFO - __main__ - Step 11214: {'lr': 0.0004952345503673166, 'samples': 2153088, 'steps': 11213, 'loss/train': 1.908733606338501} +11/06/2021 22:48:07 - INFO - __main__ - Step 11215: {'lr': 0.0004952335191057447, 'samples': 2153280, 'steps': 11214, 'loss/train': 1.707075834274292} +11/06/2021 22:48:08 - INFO - __main__ - Step 11216: {'lr': 0.0004952324877336743, 'samples': 2153472, 'steps': 11215, 'loss/train': 1.5228673219680786} +11/06/2021 22:48:09 - INFO - __main__ - Step 11217: {'lr': 0.0004952314562511059, 'samples': 2153664, 'steps': 11216, 'loss/train': 2.17525053024292} +11/06/2021 22:48:09 - INFO - __main__ - Step 11218: {'lr': 0.00049523042465804, 'samples': 2153856, 'steps': 11217, 'loss/train': 1.8961803913116455} +11/06/2021 22:48:09 - INFO - __main__ - Step 11219: {'lr': 0.0004952293929544771, 'samples': 2154048, 'steps': 11218, 'loss/train': 1.9099823236465454} +11/06/2021 22:48:10 - INFO - __main__ - Step 11220: {'lr': 0.0004952283611404176, 'samples': 2154240, 'steps': 11219, 'loss/train': 1.5863221883773804} +11/06/2021 22:48:10 - INFO - __main__ - Step 11221: {'lr': 0.0004952273292158619, 'samples': 2154432, 'steps': 11220, 'loss/train': 1.5212019681930542} +11/06/2021 22:48:11 - INFO - __main__ - Step 11222: {'lr': 0.0004952262971808106, 'samples': 2154624, 'steps': 11221, 'loss/train': 1.0951485633850098} +11/06/2021 22:48:11 - INFO - __main__ - Step 11223: {'lr': 0.0004952252650352642, 'samples': 2154816, 'steps': 11222, 'loss/train': 1.8635188341140747} +11/06/2021 22:48:12 - INFO - __main__ - Step 11224: {'lr': 0.000495224232779223, 'samples': 2155008, 'steps': 11223, 'loss/train': 1.7595049142837524} +11/06/2021 22:48:12 - INFO - __main__ - Step 11225: {'lr': 0.0004952232004126876, 'samples': 2155200, 'steps': 11224, 'loss/train': 1.5507785081863403} +11/06/2021 22:48:12 - INFO - __main__ - Step 11226: {'lr': 0.0004952221679356583, 'samples': 2155392, 'steps': 11225, 'loss/train': 1.63408625125885} +11/06/2021 22:48:13 - INFO - __main__ - Step 11227: {'lr': 0.0004952211353481358, 'samples': 2155584, 'steps': 11226, 'loss/train': 1.6727948188781738} +11/06/2021 22:48:14 - INFO - __main__ - Step 11228: {'lr': 0.0004952201026501204, 'samples': 2155776, 'steps': 11227, 'loss/train': 1.2963249683380127} +11/06/2021 22:48:14 - INFO - __main__ - Step 11229: {'lr': 0.0004952190698416126, 'samples': 2155968, 'steps': 11228, 'loss/train': 1.5582791566848755} +11/06/2021 22:48:14 - INFO - __main__ - Step 11230: {'lr': 0.0004952180369226129, 'samples': 2156160, 'steps': 11229, 'loss/train': 2.1736087799072266} +11/06/2021 22:48:15 - INFO - __main__ - Step 11231: {'lr': 0.0004952170038931217, 'samples': 2156352, 'steps': 11230, 'loss/train': 1.376936912536621} +11/06/2021 22:48:15 - INFO - __main__ - Step 11232: {'lr': 0.0004952159707531395, 'samples': 2156544, 'steps': 11231, 'loss/train': 1.1369280815124512} +11/06/2021 22:48:17 - INFO - __main__ - Step 11233: {'lr': 0.0004952149375026668, 'samples': 2156736, 'steps': 11232, 'loss/train': 1.7504469156265259} +11/06/2021 22:48:17 - INFO - __main__ - Step 11234: {'lr': 0.000495213904141704, 'samples': 2156928, 'steps': 11233, 'loss/train': 1.4631931781768799} +11/06/2021 22:48:17 - INFO - __main__ - Step 11235: {'lr': 0.0004952128706702516, 'samples': 2157120, 'steps': 11234, 'loss/train': 2.062126636505127} +11/06/2021 22:48:18 - INFO - __main__ - Step 11236: {'lr': 0.0004952118370883101, 'samples': 2157312, 'steps': 11235, 'loss/train': 2.1615216732025146} +11/06/2021 22:48:18 - INFO - __main__ - Step 11237: {'lr': 0.0004952108033958798, 'samples': 2157504, 'steps': 11236, 'loss/train': 2.1354172229766846} +11/06/2021 22:48:19 - INFO - __main__ - Step 11238: {'lr': 0.0004952097695929614, 'samples': 2157696, 'steps': 11237, 'loss/train': 1.028824806213379} +11/06/2021 22:48:19 - INFO - __main__ - Step 11239: {'lr': 0.0004952087356795553, 'samples': 2157888, 'steps': 11238, 'loss/train': 1.6951218843460083} +11/06/2021 22:48:20 - INFO - __main__ - Step 11240: {'lr': 0.0004952077016556619, 'samples': 2158080, 'steps': 11239, 'loss/train': 1.766661524772644} +11/06/2021 22:48:20 - INFO - __main__ - Step 11241: {'lr': 0.0004952066675212816, 'samples': 2158272, 'steps': 11240, 'loss/train': 1.3343703746795654} +11/06/2021 22:48:20 - INFO - __main__ - Step 11242: {'lr': 0.0004952056332764151, 'samples': 2158464, 'steps': 11241, 'loss/train': 1.303107500076294} +11/06/2021 22:48:21 - INFO - __main__ - Step 11243: {'lr': 0.0004952045989210627, 'samples': 2158656, 'steps': 11242, 'loss/train': 1.767581820487976} +11/06/2021 22:48:22 - INFO - __main__ - Step 11244: {'lr': 0.0004952035644552249, 'samples': 2158848, 'steps': 11243, 'loss/train': 1.4197368621826172} +11/06/2021 22:48:22 - INFO - __main__ - Step 11245: {'lr': 0.000495202529878902, 'samples': 2159040, 'steps': 11244, 'loss/train': 1.4061685800552368} +11/06/2021 22:48:22 - INFO - __main__ - Step 11246: {'lr': 0.0004952014951920948, 'samples': 2159232, 'steps': 11245, 'loss/train': 2.45194673538208} +11/06/2021 22:48:23 - INFO - __main__ - Step 11247: {'lr': 0.0004952004603948034, 'samples': 2159424, 'steps': 11246, 'loss/train': 2.113942861557007} +11/06/2021 22:48:24 - INFO - __main__ - Step 11248: {'lr': 0.0004951994254870286, 'samples': 2159616, 'steps': 11247, 'loss/train': 1.3976362943649292} +11/06/2021 22:48:24 - INFO - __main__ - Step 11249: {'lr': 0.0004951983904687708, 'samples': 2159808, 'steps': 11248, 'loss/train': 1.9836783409118652} +11/06/2021 22:48:24 - INFO - __main__ - Step 11250: {'lr': 0.0004951973553400303, 'samples': 2160000, 'steps': 11249, 'loss/train': 2.1718714237213135} +11/06/2021 22:48:25 - INFO - __main__ - Step 11251: {'lr': 0.0004951963201008077, 'samples': 2160192, 'steps': 11250, 'loss/train': 1.9737859964370728} +11/06/2021 22:48:25 - INFO - __main__ - Step 11252: {'lr': 0.0004951952847511033, 'samples': 2160384, 'steps': 11251, 'loss/train': 1.3120644092559814} +11/06/2021 22:48:25 - INFO - __main__ - Step 11253: {'lr': 0.0004951942492909177, 'samples': 2160576, 'steps': 11252, 'loss/train': 1.7218273878097534} +11/06/2021 22:48:26 - INFO - __main__ - Step 11254: {'lr': 0.0004951932137202515, 'samples': 2160768, 'steps': 11253, 'loss/train': 1.8016955852508545} +11/06/2021 22:48:27 - INFO - __main__ - Step 11255: {'lr': 0.0004951921780391049, 'samples': 2160960, 'steps': 11254, 'loss/train': 1.4004523754119873} +11/06/2021 22:48:27 - INFO - __main__ - Step 11256: {'lr': 0.0004951911422474785, 'samples': 2161152, 'steps': 11255, 'loss/train': 1.1996997594833374} +11/06/2021 22:48:28 - INFO - __main__ - Step 11257: {'lr': 0.0004951901063453728, 'samples': 2161344, 'steps': 11256, 'loss/train': 1.6938501596450806} +11/06/2021 22:48:28 - INFO - __main__ - Step 11258: {'lr': 0.0004951890703327883, 'samples': 2161536, 'steps': 11257, 'loss/train': 1.6818426847457886} +11/06/2021 22:48:29 - INFO - __main__ - Step 11259: {'lr': 0.0004951880342097251, 'samples': 2161728, 'steps': 11258, 'loss/train': 1.2888652086257935} +11/06/2021 22:48:29 - INFO - __main__ - Step 11260: {'lr': 0.0004951869979761842, 'samples': 2161920, 'steps': 11259, 'loss/train': 1.692081332206726} +11/06/2021 22:48:30 - INFO - __main__ - Step 11261: {'lr': 0.0004951859616321658, 'samples': 2162112, 'steps': 11260, 'loss/train': 1.8977314233779907} +11/06/2021 22:48:30 - INFO - __main__ - Step 11262: {'lr': 0.0004951849251776703, 'samples': 2162304, 'steps': 11261, 'loss/train': 3.5356547832489014} +11/06/2021 22:48:30 - INFO - __main__ - Step 11263: {'lr': 0.0004951838886126983, 'samples': 2162496, 'steps': 11262, 'loss/train': 1.3212937116622925} +11/06/2021 22:48:31 - INFO - __main__ - Step 11264: {'lr': 0.0004951828519372503, 'samples': 2162688, 'steps': 11263, 'loss/train': 1.470284104347229} +11/06/2021 22:48:32 - INFO - __main__ - Step 11265: {'lr': 0.0004951818151513267, 'samples': 2162880, 'steps': 11264, 'loss/train': 1.6359577178955078} +11/06/2021 22:48:32 - INFO - __main__ - Step 11266: {'lr': 0.0004951807782549277, 'samples': 2163072, 'steps': 11265, 'loss/train': 1.4494744539260864} +11/06/2021 22:48:32 - INFO - __main__ - Step 11267: {'lr': 0.0004951797412480544, 'samples': 2163264, 'steps': 11266, 'loss/train': 1.7457062005996704} +11/06/2021 22:48:33 - INFO - __main__ - Step 11268: {'lr': 0.0004951787041307066, 'samples': 2163456, 'steps': 11267, 'loss/train': 1.7130874395370483} +11/06/2021 22:48:34 - INFO - __main__ - Step 11269: {'lr': 0.0004951776669028851, 'samples': 2163648, 'steps': 11268, 'loss/train': 1.1853411197662354} +11/06/2021 22:48:34 - INFO - __main__ - Step 11270: {'lr': 0.0004951766295645904, 'samples': 2163840, 'steps': 11269, 'loss/train': 0.6745047569274902} +11/06/2021 22:48:34 - INFO - __main__ - Step 11271: {'lr': 0.000495175592115823, 'samples': 2164032, 'steps': 11270, 'loss/train': 2.009004592895508} +11/06/2021 22:48:35 - INFO - __main__ - Step 11272: {'lr': 0.0004951745545565831, 'samples': 2164224, 'steps': 11271, 'loss/train': 1.5138862133026123} +11/06/2021 22:48:35 - INFO - __main__ - Step 11273: {'lr': 0.0004951735168868713, 'samples': 2164416, 'steps': 11272, 'loss/train': 1.8810991048812866} +11/06/2021 22:48:36 - INFO - __main__ - Step 11274: {'lr': 0.0004951724791066881, 'samples': 2164608, 'steps': 11273, 'loss/train': 1.8236666917800903} +11/06/2021 22:48:37 - INFO - __main__ - Step 11275: {'lr': 0.0004951714412160342, 'samples': 2164800, 'steps': 11274, 'loss/train': 1.84593665599823} +11/06/2021 22:48:37 - INFO - __main__ - Step 11276: {'lr': 0.0004951704032149096, 'samples': 2164992, 'steps': 11275, 'loss/train': 1.9748361110687256} +11/06/2021 22:48:37 - INFO - __main__ - Step 11277: {'lr': 0.000495169365103315, 'samples': 2165184, 'steps': 11276, 'loss/train': 1.7609519958496094} +11/06/2021 22:48:38 - INFO - __main__ - Step 11278: {'lr': 0.0004951683268812511, 'samples': 2165376, 'steps': 11277, 'loss/train': 2.1392531394958496} +11/06/2021 22:48:38 - INFO - __main__ - Step 11279: {'lr': 0.0004951672885487178, 'samples': 2165568, 'steps': 11278, 'loss/train': 1.3590013980865479} +11/06/2021 22:48:39 - INFO - __main__ - Step 11280: {'lr': 0.0004951662501057161, 'samples': 2165760, 'steps': 11279, 'loss/train': 1.762505054473877} +11/06/2021 22:48:39 - INFO - __main__ - Step 11281: {'lr': 0.0004951652115522462, 'samples': 2165952, 'steps': 11280, 'loss/train': 1.7629950046539307} +11/06/2021 22:48:40 - INFO - __main__ - Step 11282: {'lr': 0.0004951641728883087, 'samples': 2166144, 'steps': 11281, 'loss/train': 2.0722081661224365} +11/06/2021 22:48:40 - INFO - __main__ - Step 11283: {'lr': 0.000495163134113904, 'samples': 2166336, 'steps': 11282, 'loss/train': 1.4518979787826538} +11/06/2021 22:48:40 - INFO - __main__ - Step 11284: {'lr': 0.0004951620952290325, 'samples': 2166528, 'steps': 11283, 'loss/train': 1.5402740240097046} +11/06/2021 22:48:41 - INFO - __main__ - Step 11285: {'lr': 0.0004951610562336949, 'samples': 2166720, 'steps': 11284, 'loss/train': 1.6244908571243286} +11/06/2021 22:48:42 - INFO - __main__ - Step 11286: {'lr': 0.0004951600171278914, 'samples': 2166912, 'steps': 11285, 'loss/train': 1.898524522781372} +11/06/2021 22:48:42 - INFO - __main__ - Step 11287: {'lr': 0.0004951589779116225, 'samples': 2167104, 'steps': 11286, 'loss/train': 1.5938304662704468} +11/06/2021 22:48:42 - INFO - __main__ - Step 11288: {'lr': 0.0004951579385848889, 'samples': 2167296, 'steps': 11287, 'loss/train': 1.7559034824371338} +11/06/2021 22:48:43 - INFO - __main__ - Step 11289: {'lr': 0.0004951568991476908, 'samples': 2167488, 'steps': 11288, 'loss/train': 1.3978345394134521} +11/06/2021 22:48:44 - INFO - __main__ - Step 11290: {'lr': 0.0004951558596000289, 'samples': 2167680, 'steps': 11289, 'loss/train': 2.016148328781128} +11/06/2021 22:48:44 - INFO - __main__ - Step 11291: {'lr': 0.0004951548199419035, 'samples': 2167872, 'steps': 11290, 'loss/train': 1.7956223487854004} +11/06/2021 22:48:45 - INFO - __main__ - Step 11292: {'lr': 0.0004951537801733152, 'samples': 2168064, 'steps': 11291, 'loss/train': 2.4459264278411865} +11/06/2021 22:48:45 - INFO - __main__ - Step 11293: {'lr': 0.0004951527402942643, 'samples': 2168256, 'steps': 11292, 'loss/train': 1.4760860204696655} +11/06/2021 22:48:45 - INFO - __main__ - Step 11294: {'lr': 0.0004951517003047512, 'samples': 2168448, 'steps': 11293, 'loss/train': 1.7521895170211792} +11/06/2021 22:48:46 - INFO - __main__ - Step 11295: {'lr': 0.0004951506602047767, 'samples': 2168640, 'steps': 11294, 'loss/train': 1.6032721996307373} +11/06/2021 22:48:47 - INFO - __main__ - Step 11296: {'lr': 0.0004951496199943412, 'samples': 2168832, 'steps': 11295, 'loss/train': 1.7261722087860107} +11/06/2021 22:48:47 - INFO - __main__ - Step 11297: {'lr': 0.0004951485796734448, 'samples': 2169024, 'steps': 11296, 'loss/train': 1.5861694812774658} +11/06/2021 22:48:47 - INFO - __main__ - Step 11298: {'lr': 0.0004951475392420884, 'samples': 2169216, 'steps': 11297, 'loss/train': 2.0938913822174072} +11/06/2021 22:48:48 - INFO - __main__ - Step 11299: {'lr': 0.0004951464987002724, 'samples': 2169408, 'steps': 11298, 'loss/train': 1.6789658069610596} +11/06/2021 22:48:49 - INFO - __main__ - Step 11300: {'lr': 0.000495145458047997, 'samples': 2169600, 'steps': 11299, 'loss/train': 1.7498912811279297} +11/06/2021 22:48:49 - INFO - __main__ - Step 11301: {'lr': 0.0004951444172852629, 'samples': 2169792, 'steps': 11300, 'loss/train': 1.6389604806900024} +11/06/2021 22:48:50 - INFO - __main__ - Step 11302: {'lr': 0.0004951433764120705, 'samples': 2169984, 'steps': 11301, 'loss/train': 1.9538257122039795} +11/06/2021 22:48:50 - INFO - __main__ - Step 11303: {'lr': 0.0004951423354284202, 'samples': 2170176, 'steps': 11302, 'loss/train': 1.9088263511657715} +11/06/2021 22:48:50 - INFO - __main__ - Step 11304: {'lr': 0.0004951412943343126, 'samples': 2170368, 'steps': 11303, 'loss/train': 1.584460735321045} +11/06/2021 22:48:51 - INFO - __main__ - Step 11305: {'lr': 0.0004951402531297482, 'samples': 2170560, 'steps': 11304, 'loss/train': 2.0329270362854004} +11/06/2021 22:48:52 - INFO - __main__ - Step 11306: {'lr': 0.0004951392118147273, 'samples': 2170752, 'steps': 11305, 'loss/train': 1.8602527379989624} +11/06/2021 22:48:52 - INFO - __main__ - Step 11307: {'lr': 0.0004951381703892506, 'samples': 2170944, 'steps': 11306, 'loss/train': 2.025909185409546} +11/06/2021 22:48:52 - INFO - __main__ - Step 11308: {'lr': 0.0004951371288533182, 'samples': 2171136, 'steps': 11307, 'loss/train': 2.1841092109680176} +11/06/2021 22:48:53 - INFO - __main__ - Step 11309: {'lr': 0.0004951360872069309, 'samples': 2171328, 'steps': 11308, 'loss/train': 1.3344480991363525} +11/06/2021 22:48:53 - INFO - __main__ - Step 11310: {'lr': 0.0004951350454500891, 'samples': 2171520, 'steps': 11309, 'loss/train': 1.7531185150146484} +11/06/2021 22:48:54 - INFO - __main__ - Step 11311: {'lr': 0.0004951340035827932, 'samples': 2171712, 'steps': 11310, 'loss/train': 1.6113486289978027} +11/06/2021 22:48:54 - INFO - __main__ - Step 11312: {'lr': 0.0004951329616050437, 'samples': 2171904, 'steps': 11311, 'loss/train': 1.9962801933288574} +11/06/2021 22:48:55 - INFO - __main__ - Step 11313: {'lr': 0.000495131919516841, 'samples': 2172096, 'steps': 11312, 'loss/train': 1.5207346677780151} +11/06/2021 22:48:55 - INFO - __main__ - Step 11314: {'lr': 0.0004951308773181856, 'samples': 2172288, 'steps': 11313, 'loss/train': 2.1913249492645264} +11/06/2021 22:48:55 - INFO - __main__ - Step 11315: {'lr': 0.0004951298350090782, 'samples': 2172480, 'steps': 11314, 'loss/train': 1.2448691129684448} +11/06/2021 22:48:56 - INFO - __main__ - Step 11316: {'lr': 0.000495128792589519, 'samples': 2172672, 'steps': 11315, 'loss/train': 2.215278387069702} +11/06/2021 22:48:57 - INFO - __main__ - Step 11317: {'lr': 0.0004951277500595085, 'samples': 2172864, 'steps': 11316, 'loss/train': 1.4738010168075562} +11/06/2021 22:48:57 - INFO - __main__ - Step 11318: {'lr': 0.0004951267074190473, 'samples': 2173056, 'steps': 11317, 'loss/train': 1.4282978773117065} +11/06/2021 22:48:58 - INFO - __main__ - Step 11319: {'lr': 0.0004951256646681356, 'samples': 2173248, 'steps': 11318, 'loss/train': 1.662163496017456} +11/06/2021 22:48:58 - INFO - __main__ - Step 11320: {'lr': 0.0004951246218067744, 'samples': 2173440, 'steps': 11319, 'loss/train': 1.9382797479629517} +11/06/2021 22:48:59 - INFO - __main__ - Step 11321: {'lr': 0.0004951235788349636, 'samples': 2173632, 'steps': 11320, 'loss/train': 3.9597983360290527} +11/06/2021 22:48:59 - INFO - __main__ - Step 11322: {'lr': 0.0004951225357527038, 'samples': 2173824, 'steps': 11321, 'loss/train': 1.7996548414230347} +11/06/2021 22:49:00 - INFO - __main__ - Step 11323: {'lr': 0.0004951214925599957, 'samples': 2174016, 'steps': 11322, 'loss/train': 1.6424283981323242} +11/06/2021 22:49:00 - INFO - __main__ - Step 11324: {'lr': 0.0004951204492568397, 'samples': 2174208, 'steps': 11323, 'loss/train': 1.757283329963684} +11/06/2021 22:49:00 - INFO - __main__ - Step 11325: {'lr': 0.0004951194058432361, 'samples': 2174400, 'steps': 11324, 'loss/train': 1.688281774520874} +11/06/2021 22:49:01 - INFO - __main__ - Step 11326: {'lr': 0.0004951183623191855, 'samples': 2174592, 'steps': 11325, 'loss/train': 1.493397831916809} +11/06/2021 22:49:02 - INFO - __main__ - Step 11327: {'lr': 0.0004951173186846884, 'samples': 2174784, 'steps': 11326, 'loss/train': 3.6629881858825684} +11/06/2021 22:49:02 - INFO - __main__ - Step 11328: {'lr': 0.0004951162749397452, 'samples': 2174976, 'steps': 11327, 'loss/train': 3.2852323055267334} +11/06/2021 22:49:03 - INFO - __main__ - Step 11329: {'lr': 0.0004951152310843564, 'samples': 2175168, 'steps': 11328, 'loss/train': 1.8344948291778564} +11/06/2021 22:49:03 - INFO - __main__ - Step 11330: {'lr': 0.0004951141871185224, 'samples': 2175360, 'steps': 11329, 'loss/train': 2.280247449874878} +11/06/2021 22:49:03 - INFO - __main__ - Step 11331: {'lr': 0.0004951131430422438, 'samples': 2175552, 'steps': 11330, 'loss/train': 1.4350394010543823} +11/06/2021 22:49:05 - INFO - __main__ - Step 11332: {'lr': 0.0004951120988555209, 'samples': 2175744, 'steps': 11331, 'loss/train': 2.2273924350738525} +11/06/2021 22:49:05 - INFO - __main__ - Step 11333: {'lr': 0.0004951110545583543, 'samples': 2175936, 'steps': 11332, 'loss/train': 1.8531851768493652} +11/06/2021 22:49:05 - INFO - __main__ - Step 11334: {'lr': 0.0004951100101507445, 'samples': 2176128, 'steps': 11333, 'loss/train': 1.8258116245269775} +11/06/2021 22:49:06 - INFO - __main__ - Step 11335: {'lr': 0.0004951089656326919, 'samples': 2176320, 'steps': 11334, 'loss/train': 0.3128710389137268} +11/06/2021 22:49:06 - INFO - __main__ - Step 11336: {'lr': 0.0004951079210041969, 'samples': 2176512, 'steps': 11335, 'loss/train': 1.8034968376159668} +11/06/2021 22:49:06 - INFO - __main__ - Step 11337: {'lr': 0.0004951068762652602, 'samples': 2176704, 'steps': 11336, 'loss/train': 1.5365264415740967} +11/06/2021 22:49:07 - INFO - __main__ - Step 11338: {'lr': 0.000495105831415882, 'samples': 2176896, 'steps': 11337, 'loss/train': 1.9638972282409668} +11/06/2021 22:49:08 - INFO - __main__ - Step 11339: {'lr': 0.0004951047864560629, 'samples': 2177088, 'steps': 11338, 'loss/train': 1.64912748336792} +11/06/2021 22:49:08 - INFO - __main__ - Step 11340: {'lr': 0.0004951037413858034, 'samples': 2177280, 'steps': 11339, 'loss/train': 1.4875028133392334} +11/06/2021 22:49:08 - INFO - __main__ - Step 11341: {'lr': 0.000495102696205104, 'samples': 2177472, 'steps': 11340, 'loss/train': 1.8226743936538696} +11/06/2021 22:49:09 - INFO - __main__ - Step 11342: {'lr': 0.000495101650913965, 'samples': 2177664, 'steps': 11341, 'loss/train': 1.8261113166809082} +11/06/2021 22:49:10 - INFO - __main__ - Step 11343: {'lr': 0.000495100605512387, 'samples': 2177856, 'steps': 11342, 'loss/train': 1.8620246648788452} +11/06/2021 22:49:10 - INFO - __main__ - Step 11344: {'lr': 0.0004950995600003705, 'samples': 2178048, 'steps': 11343, 'loss/train': 1.7309132814407349} +11/06/2021 22:49:10 - INFO - __main__ - Step 11345: {'lr': 0.0004950985143779159, 'samples': 2178240, 'steps': 11344, 'loss/train': 1.5737980604171753} +11/06/2021 22:49:11 - INFO - __main__ - Step 11346: {'lr': 0.0004950974686450237, 'samples': 2178432, 'steps': 11345, 'loss/train': 1.4471863508224487} +11/06/2021 22:49:11 - INFO - __main__ - Step 11347: {'lr': 0.0004950964228016944, 'samples': 2178624, 'steps': 11346, 'loss/train': 1.8836588859558105} +11/06/2021 22:49:12 - INFO - __main__ - Step 11348: {'lr': 0.0004950953768479284, 'samples': 2178816, 'steps': 11347, 'loss/train': 1.526648998260498} +11/06/2021 22:49:12 - INFO - __main__ - Step 11349: {'lr': 0.0004950943307837261, 'samples': 2179008, 'steps': 11348, 'loss/train': 1.9713560342788696} +11/06/2021 22:49:13 - INFO - __main__ - Step 11350: {'lr': 0.0004950932846090882, 'samples': 2179200, 'steps': 11349, 'loss/train': 1.60298490524292} +11/06/2021 22:49:13 - INFO - __main__ - Step 11351: {'lr': 0.000495092238324015, 'samples': 2179392, 'steps': 11350, 'loss/train': 1.1730953454971313} +11/06/2021 22:49:13 - INFO - __main__ - Step 11352: {'lr': 0.0004950911919285071, 'samples': 2179584, 'steps': 11351, 'loss/train': 1.5877281427383423} +11/06/2021 22:49:15 - INFO - __main__ - Step 11353: {'lr': 0.0004950901454225647, 'samples': 2179776, 'steps': 11352, 'loss/train': 1.8872724771499634} +11/06/2021 22:49:15 - INFO - __main__ - Step 11354: {'lr': 0.0004950890988061886, 'samples': 2179968, 'steps': 11353, 'loss/train': 2.0779507160186768} +11/06/2021 22:49:15 - INFO - __main__ - Step 11355: {'lr': 0.0004950880520793791, 'samples': 2180160, 'steps': 11354, 'loss/train': 1.030417561531067} +11/06/2021 22:49:16 - INFO - __main__ - Step 11356: {'lr': 0.0004950870052421368, 'samples': 2180352, 'steps': 11355, 'loss/train': 1.806678295135498} +11/06/2021 22:49:16 - INFO - __main__ - Step 11357: {'lr': 0.000495085958294462, 'samples': 2180544, 'steps': 11356, 'loss/train': 1.621626377105713} +11/06/2021 22:49:17 - INFO - __main__ - Step 11358: {'lr': 0.0004950849112363553, 'samples': 2180736, 'steps': 11357, 'loss/train': 0.5637978911399841} +11/06/2021 22:49:17 - INFO - __main__ - Step 11359: {'lr': 0.000495083864067817, 'samples': 2180928, 'steps': 11358, 'loss/train': 1.728484869003296} +11/06/2021 22:49:18 - INFO - __main__ - Step 11360: {'lr': 0.0004950828167888478, 'samples': 2181120, 'steps': 11359, 'loss/train': 1.9310498237609863} +11/06/2021 22:49:18 - INFO - __main__ - Step 11361: {'lr': 0.0004950817693994481, 'samples': 2181312, 'steps': 11360, 'loss/train': 1.8141530752182007} +11/06/2021 22:49:18 - INFO - __main__ - Step 11362: {'lr': 0.0004950807218996182, 'samples': 2181504, 'steps': 11361, 'loss/train': 2.154552936553955} +11/06/2021 22:49:19 - INFO - __main__ - Step 11363: {'lr': 0.0004950796742893588, 'samples': 2181696, 'steps': 11362, 'loss/train': 1.7956241369247437} +11/06/2021 22:49:20 - INFO - __main__ - Step 11364: {'lr': 0.0004950786265686702, 'samples': 2181888, 'steps': 11363, 'loss/train': 1.6461005210876465} +11/06/2021 22:49:20 - INFO - __main__ - Step 11365: {'lr': 0.000495077578737553, 'samples': 2182080, 'steps': 11364, 'loss/train': 1.5644863843917847} +11/06/2021 22:49:20 - INFO - __main__ - Step 11366: {'lr': 0.0004950765307960076, 'samples': 2182272, 'steps': 11365, 'loss/train': 1.4656745195388794} +11/06/2021 22:49:21 - INFO - __main__ - Step 11367: {'lr': 0.0004950754827440346, 'samples': 2182464, 'steps': 11366, 'loss/train': 1.9674415588378906} +11/06/2021 22:49:21 - INFO - __main__ - Step 11368: {'lr': 0.0004950744345816342, 'samples': 2182656, 'steps': 11367, 'loss/train': 1.2006498575210571} +11/06/2021 22:49:22 - INFO - __main__ - Step 11369: {'lr': 0.0004950733863088072, 'samples': 2182848, 'steps': 11368, 'loss/train': 2.536311388015747} +11/06/2021 22:49:22 - INFO - __main__ - Step 11370: {'lr': 0.0004950723379255538, 'samples': 2183040, 'steps': 11369, 'loss/train': 1.9103096723556519} +11/06/2021 22:49:23 - INFO - __main__ - Step 11371: {'lr': 0.0004950712894318748, 'samples': 2183232, 'steps': 11370, 'loss/train': 1.7062427997589111} +11/06/2021 22:49:23 - INFO - __main__ - Step 11372: {'lr': 0.0004950702408277702, 'samples': 2183424, 'steps': 11371, 'loss/train': 1.4938647747039795} +11/06/2021 22:49:23 - INFO - __main__ - Step 11373: {'lr': 0.0004950691921132409, 'samples': 2183616, 'steps': 11372, 'loss/train': 1.9969819784164429} +11/06/2021 22:49:24 - INFO - __main__ - Step 11374: {'lr': 0.000495068143288287, 'samples': 2183808, 'steps': 11373, 'loss/train': 1.8315733671188354} +11/06/2021 22:49:25 - INFO - __main__ - Step 11375: {'lr': 0.0004950670943529094, 'samples': 2184000, 'steps': 11374, 'loss/train': 0.9384849071502686} +11/06/2021 22:49:25 - INFO - __main__ - Step 11376: {'lr': 0.0004950660453071082, 'samples': 2184192, 'steps': 11375, 'loss/train': 1.814307689666748} +11/06/2021 22:49:25 - INFO - __main__ - Step 11377: {'lr': 0.0004950649961508841, 'samples': 2184384, 'steps': 11376, 'loss/train': 2.194822311401367} +11/06/2021 22:49:26 - INFO - __main__ - Step 11378: {'lr': 0.0004950639468842375, 'samples': 2184576, 'steps': 11377, 'loss/train': 2.181577205657959} +11/06/2021 22:49:27 - INFO - __main__ - Step 11379: {'lr': 0.0004950628975071688, 'samples': 2184768, 'steps': 11378, 'loss/train': 1.6916229724884033} +11/06/2021 22:49:27 - INFO - __main__ - Step 11380: {'lr': 0.0004950618480196785, 'samples': 2184960, 'steps': 11379, 'loss/train': 1.5891834497451782} +11/06/2021 22:49:28 - INFO - __main__ - Step 11381: {'lr': 0.0004950607984217674, 'samples': 2185152, 'steps': 11380, 'loss/train': 1.64052414894104} +11/06/2021 22:49:28 - INFO - __main__ - Step 11382: {'lr': 0.0004950597487134354, 'samples': 2185344, 'steps': 11381, 'loss/train': 2.620680570602417} +11/06/2021 22:49:28 - INFO - __main__ - Step 11383: {'lr': 0.0004950586988946834, 'samples': 2185536, 'steps': 11382, 'loss/train': 1.9298031330108643} +11/06/2021 22:49:29 - INFO - __main__ - Step 11384: {'lr': 0.0004950576489655116, 'samples': 2185728, 'steps': 11383, 'loss/train': 1.8474303483963013} +11/06/2021 22:49:30 - INFO - __main__ - Step 11385: {'lr': 0.0004950565989259207, 'samples': 2185920, 'steps': 11384, 'loss/train': 1.4204002618789673} +11/06/2021 22:49:30 - INFO - __main__ - Step 11386: {'lr': 0.000495055548775911, 'samples': 2186112, 'steps': 11385, 'loss/train': 1.618093729019165} +11/06/2021 22:49:30 - INFO - __main__ - Step 11387: {'lr': 0.0004950544985154831, 'samples': 2186304, 'steps': 11386, 'loss/train': 2.119515895843506} +11/06/2021 22:49:31 - INFO - __main__ - Step 11388: {'lr': 0.0004950534481446375, 'samples': 2186496, 'steps': 11387, 'loss/train': 2.0047428607940674} +11/06/2021 22:49:31 - INFO - __main__ - Step 11389: {'lr': 0.0004950523976633745, 'samples': 2186688, 'steps': 11388, 'loss/train': 1.9979164600372314} +11/06/2021 22:49:32 - INFO - __main__ - Step 11390: {'lr': 0.0004950513470716947, 'samples': 2186880, 'steps': 11389, 'loss/train': 1.188913345336914} +11/06/2021 22:49:32 - INFO - __main__ - Step 11391: {'lr': 0.0004950502963695985, 'samples': 2187072, 'steps': 11390, 'loss/train': 1.6476091146469116} +11/06/2021 22:49:33 - INFO - __main__ - Step 11392: {'lr': 0.0004950492455570865, 'samples': 2187264, 'steps': 11391, 'loss/train': 7.051599502563477} +11/06/2021 22:49:33 - INFO - __main__ - Step 11393: {'lr': 0.000495048194634159, 'samples': 2187456, 'steps': 11392, 'loss/train': 1.676889419555664} +11/06/2021 22:49:33 - INFO - __main__ - Step 11394: {'lr': 0.0004950471436008167, 'samples': 2187648, 'steps': 11393, 'loss/train': 1.9109240770339966} +11/06/2021 22:49:35 - INFO - __main__ - Step 11395: {'lr': 0.0004950460924570598, 'samples': 2187840, 'steps': 11394, 'loss/train': 1.9026075601577759} +11/06/2021 22:49:35 - INFO - __main__ - Step 11396: {'lr': 0.0004950450412028889, 'samples': 2188032, 'steps': 11395, 'loss/train': 1.8585050106048584} +11/06/2021 22:49:35 - INFO - __main__ - Step 11397: {'lr': 0.0004950439898383047, 'samples': 2188224, 'steps': 11396, 'loss/train': 2.125458002090454} +11/06/2021 22:49:36 - INFO - __main__ - Step 11398: {'lr': 0.0004950429383633073, 'samples': 2188416, 'steps': 11397, 'loss/train': 1.5339622497558594} +11/06/2021 22:49:36 - INFO - __main__ - Step 11399: {'lr': 0.0004950418867778973, 'samples': 2188608, 'steps': 11398, 'loss/train': 1.875319480895996} +11/06/2021 22:49:37 - INFO - __main__ - Step 11400: {'lr': 0.0004950408350820752, 'samples': 2188800, 'steps': 11399, 'loss/train': 1.5913536548614502} +11/06/2021 22:49:37 - INFO - __main__ - Step 11401: {'lr': 0.0004950397832758415, 'samples': 2188992, 'steps': 11400, 'loss/train': 1.3669840097427368} +11/06/2021 22:49:38 - INFO - __main__ - Step 11402: {'lr': 0.0004950387313591968, 'samples': 2189184, 'steps': 11401, 'loss/train': 1.8628370761871338} +11/06/2021 22:49:38 - INFO - __main__ - Step 11403: {'lr': 0.0004950376793321413, 'samples': 2189376, 'steps': 11402, 'loss/train': 1.7271697521209717} +11/06/2021 22:49:38 - INFO - __main__ - Step 11404: {'lr': 0.0004950366271946756, 'samples': 2189568, 'steps': 11403, 'loss/train': 2.1682770252227783} +11/06/2021 22:49:39 - INFO - __main__ - Step 11405: {'lr': 0.0004950355749468001, 'samples': 2189760, 'steps': 11404, 'loss/train': 1.8250188827514648} +11/06/2021 22:49:40 - INFO - __main__ - Step 11406: {'lr': 0.0004950345225885155, 'samples': 2189952, 'steps': 11405, 'loss/train': 1.594653844833374} +11/06/2021 22:49:40 - INFO - __main__ - Step 11407: {'lr': 0.0004950334701198222, 'samples': 2190144, 'steps': 11406, 'loss/train': 1.9516605138778687} +11/06/2021 22:49:40 - INFO - __main__ - Step 11408: {'lr': 0.0004950324175407204, 'samples': 2190336, 'steps': 11407, 'loss/train': 1.3681046962738037} +11/06/2021 22:49:41 - INFO - __main__ - Step 11409: {'lr': 0.0004950313648512108, 'samples': 2190528, 'steps': 11408, 'loss/train': 1.6536760330200195} +11/06/2021 22:49:42 - INFO - __main__ - Step 11410: {'lr': 0.0004950303120512939, 'samples': 2190720, 'steps': 11409, 'loss/train': 1.9302911758422852} +11/06/2021 22:49:42 - INFO - __main__ - Step 11411: {'lr': 0.0004950292591409701, 'samples': 2190912, 'steps': 11410, 'loss/train': 2.0202114582061768} +11/06/2021 22:49:42 - INFO - __main__ - Step 11412: {'lr': 0.0004950282061202399, 'samples': 2191104, 'steps': 11411, 'loss/train': 1.8923609256744385} +11/06/2021 22:49:43 - INFO - __main__ - Step 11413: {'lr': 0.0004950271529891038, 'samples': 2191296, 'steps': 11412, 'loss/train': 1.6358274221420288} +11/06/2021 22:49:43 - INFO - __main__ - Step 11414: {'lr': 0.0004950260997475623, 'samples': 2191488, 'steps': 11413, 'loss/train': 1.7055529356002808} +11/06/2021 22:49:43 - INFO - __main__ - Step 11415: {'lr': 0.0004950250463956157, 'samples': 2191680, 'steps': 11414, 'loss/train': 1.4822801351547241} +11/06/2021 22:49:44 - INFO - __main__ - Step 11416: {'lr': 0.0004950239929332646, 'samples': 2191872, 'steps': 11415, 'loss/train': 1.7098220586776733} +11/06/2021 22:49:45 - INFO - __main__ - Step 11417: {'lr': 0.0004950229393605095, 'samples': 2192064, 'steps': 11416, 'loss/train': 1.437166690826416} +11/06/2021 22:49:45 - INFO - __main__ - Step 11418: {'lr': 0.0004950218856773509, 'samples': 2192256, 'steps': 11417, 'loss/train': 1.7919132709503174} +11/06/2021 22:49:46 - INFO - __main__ - Step 11419: {'lr': 0.0004950208318837892, 'samples': 2192448, 'steps': 11418, 'loss/train': 1.5548012256622314} +11/06/2021 22:49:46 - INFO - __main__ - Step 11420: {'lr': 0.0004950197779798248, 'samples': 2192640, 'steps': 11419, 'loss/train': 1.615087628364563} +11/06/2021 22:49:47 - INFO - __main__ - Step 11421: {'lr': 0.0004950187239654584, 'samples': 2192832, 'steps': 11420, 'loss/train': 1.5422042608261108} +11/06/2021 22:49:47 - INFO - __main__ - Step 11422: {'lr': 0.0004950176698406903, 'samples': 2193024, 'steps': 11421, 'loss/train': 1.7497607469558716} +11/06/2021 22:49:48 - INFO - __main__ - Step 11423: {'lr': 0.000495016615605521, 'samples': 2193216, 'steps': 11422, 'loss/train': 1.8676695823669434} +11/06/2021 22:49:48 - INFO - __main__ - Step 11424: {'lr': 0.0004950155612599511, 'samples': 2193408, 'steps': 11423, 'loss/train': 1.7228354215621948} +11/06/2021 22:49:48 - INFO - __main__ - Step 11425: {'lr': 0.0004950145068039808, 'samples': 2193600, 'steps': 11424, 'loss/train': 2.0538418292999268} +11/06/2021 22:49:50 - INFO - __main__ - Step 11426: {'lr': 0.0004950134522376108, 'samples': 2193792, 'steps': 11425, 'loss/train': 2.0715749263763428} +11/06/2021 22:49:50 - INFO - __main__ - Step 11427: {'lr': 0.0004950123975608415, 'samples': 2193984, 'steps': 11426, 'loss/train': 1.7007184028625488} +11/06/2021 22:49:50 - INFO - __main__ - Step 11428: {'lr': 0.0004950113427736734, 'samples': 2194176, 'steps': 11427, 'loss/train': 3.19921612739563} +11/06/2021 22:49:51 - INFO - __main__ - Step 11429: {'lr': 0.000495010287876107, 'samples': 2194368, 'steps': 11428, 'loss/train': 1.4021397829055786} +11/06/2021 22:49:51 - INFO - __main__ - Step 11430: {'lr': 0.0004950092328681428, 'samples': 2194560, 'steps': 11429, 'loss/train': 1.3537622690200806} +11/06/2021 22:49:52 - INFO - __main__ - Step 11431: {'lr': 0.0004950081777497812, 'samples': 2194752, 'steps': 11430, 'loss/train': 2.075549840927124} +11/06/2021 22:49:52 - INFO - __main__ - Step 11432: {'lr': 0.0004950071225210226, 'samples': 2194944, 'steps': 11431, 'loss/train': 2.2437236309051514} +11/06/2021 22:49:53 - INFO - __main__ - Step 11433: {'lr': 0.0004950060671818676, 'samples': 2195136, 'steps': 11432, 'loss/train': 1.8015081882476807} +11/06/2021 22:49:53 - INFO - __main__ - Step 11434: {'lr': 0.0004950050117323167, 'samples': 2195328, 'steps': 11433, 'loss/train': 1.7495261430740356} +11/06/2021 22:49:54 - INFO - __main__ - Step 11435: {'lr': 0.0004950039561723703, 'samples': 2195520, 'steps': 11434, 'loss/train': 2.0817348957061768} +11/06/2021 22:49:54 - INFO - __main__ - Step 11436: {'lr': 0.0004950029005020289, 'samples': 2195712, 'steps': 11435, 'loss/train': 1.7753431797027588} +11/06/2021 22:49:55 - INFO - __main__ - Step 11437: {'lr': 0.0004950018447212929, 'samples': 2195904, 'steps': 11436, 'loss/train': 2.0094332695007324} +11/06/2021 22:49:55 - INFO - __main__ - Step 11438: {'lr': 0.000495000788830163, 'samples': 2196096, 'steps': 11437, 'loss/train': 1.0826306343078613} +11/06/2021 22:49:56 - INFO - __main__ - Step 11439: {'lr': 0.0004949997328286394, 'samples': 2196288, 'steps': 11438, 'loss/train': 1.5447814464569092} +11/06/2021 22:49:56 - INFO - __main__ - Step 11440: {'lr': 0.0004949986767167228, 'samples': 2196480, 'steps': 11439, 'loss/train': 1.7402944564819336} +11/06/2021 22:49:56 - INFO - __main__ - Step 11441: {'lr': 0.0004949976204944135, 'samples': 2196672, 'steps': 11440, 'loss/train': 1.6975988149642944} +11/06/2021 22:49:57 - INFO - __main__ - Step 11442: {'lr': 0.0004949965641617121, 'samples': 2196864, 'steps': 11441, 'loss/train': 1.6777021884918213} +11/06/2021 22:49:58 - INFO - __main__ - Step 11443: {'lr': 0.000494995507718619, 'samples': 2197056, 'steps': 11442, 'loss/train': 1.3952085971832275} +11/06/2021 22:49:58 - INFO - __main__ - Step 11444: {'lr': 0.0004949944511651347, 'samples': 2197248, 'steps': 11443, 'loss/train': 1.7834969758987427} +11/06/2021 22:49:58 - INFO - __main__ - Step 11445: {'lr': 0.0004949933945012597, 'samples': 2197440, 'steps': 11444, 'loss/train': 1.753387212753296} +11/06/2021 22:49:59 - INFO - __main__ - Step 11446: {'lr': 0.0004949923377269945, 'samples': 2197632, 'steps': 11445, 'loss/train': 2.039705753326416} +11/06/2021 22:49:59 - INFO - __main__ - Step 11447: {'lr': 0.0004949912808423394, 'samples': 2197824, 'steps': 11446, 'loss/train': 1.4728835821151733} +11/06/2021 22:50:01 - INFO - __main__ - Step 11448: {'lr': 0.000494990223847295, 'samples': 2198016, 'steps': 11447, 'loss/train': 1.628504991531372} +11/06/2021 22:50:01 - INFO - __main__ - Step 11449: {'lr': 0.000494989166741862, 'samples': 2198208, 'steps': 11448, 'loss/train': 2.0440473556518555} +11/06/2021 22:50:01 - INFO - __main__ - Step 11450: {'lr': 0.0004949881095260405, 'samples': 2198400, 'steps': 11449, 'loss/train': 1.660749912261963} +11/06/2021 22:50:02 - INFO - __main__ - Step 11451: {'lr': 0.0004949870521998312, 'samples': 2198592, 'steps': 11450, 'loss/train': 1.8337377309799194} +11/06/2021 22:50:02 - INFO - __main__ - Step 11452: {'lr': 0.0004949859947632344, 'samples': 2198784, 'steps': 11451, 'loss/train': 1.8013213872909546} +11/06/2021 22:50:03 - INFO - __main__ - Step 11453: {'lr': 0.0004949849372162509, 'samples': 2198976, 'steps': 11452, 'loss/train': 1.1063177585601807} +11/06/2021 22:50:03 - INFO - __main__ - Step 11454: {'lr': 0.0004949838795588808, 'samples': 2199168, 'steps': 11453, 'loss/train': 1.6007579565048218} +11/06/2021 22:50:04 - INFO - __main__ - Step 11455: {'lr': 0.0004949828217911248, 'samples': 2199360, 'steps': 11454, 'loss/train': 1.6126108169555664} +11/06/2021 22:50:04 - INFO - __main__ - Step 11456: {'lr': 0.0004949817639129832, 'samples': 2199552, 'steps': 11455, 'loss/train': 1.85826575756073} +11/06/2021 22:50:04 - INFO - __main__ - Step 11457: {'lr': 0.0004949807059244568, 'samples': 2199744, 'steps': 11456, 'loss/train': 1.6572095155715942} +11/06/2021 22:50:05 - INFO - __main__ - Step 11458: {'lr': 0.0004949796478255458, 'samples': 2199936, 'steps': 11457, 'loss/train': 1.5031503438949585} +11/06/2021 22:50:06 - INFO - __main__ - Step 11459: {'lr': 0.0004949785896162507, 'samples': 2200128, 'steps': 11458, 'loss/train': 1.6806023120880127} +11/06/2021 22:50:06 - INFO - __main__ - Step 11460: {'lr': 0.0004949775312965721, 'samples': 2200320, 'steps': 11459, 'loss/train': 1.5449903011322021} +11/06/2021 22:50:06 - INFO - __main__ - Step 11461: {'lr': 0.0004949764728665103, 'samples': 2200512, 'steps': 11460, 'loss/train': 1.651967167854309} +11/06/2021 22:50:07 - INFO - __main__ - Step 11462: {'lr': 0.000494975414326066, 'samples': 2200704, 'steps': 11461, 'loss/train': 1.8669898509979248} +11/06/2021 22:50:07 - INFO - __main__ - Step 11463: {'lr': 0.0004949743556752395, 'samples': 2200896, 'steps': 11462, 'loss/train': 1.9016015529632568} +11/06/2021 22:50:08 - INFO - __main__ - Step 11464: {'lr': 0.0004949732969140313, 'samples': 2201088, 'steps': 11463, 'loss/train': 1.5884931087493896} +11/06/2021 22:50:09 - INFO - __main__ - Step 11465: {'lr': 0.000494972238042442, 'samples': 2201280, 'steps': 11464, 'loss/train': 1.8496793508529663} +11/06/2021 22:50:09 - INFO - __main__ - Step 11466: {'lr': 0.0004949711790604719, 'samples': 2201472, 'steps': 11465, 'loss/train': 1.83021879196167} +11/06/2021 22:50:09 - INFO - __main__ - Step 11467: {'lr': 0.0004949701199681217, 'samples': 2201664, 'steps': 11466, 'loss/train': 1.7761445045471191} +11/06/2021 22:50:10 - INFO - __main__ - Step 11468: {'lr': 0.0004949690607653916, 'samples': 2201856, 'steps': 11467, 'loss/train': 1.5645625591278076} +11/06/2021 22:50:10 - INFO - __main__ - Step 11469: {'lr': 0.0004949680014522822, 'samples': 2202048, 'steps': 11468, 'loss/train': 1.7550435066223145} +11/06/2021 22:50:11 - INFO - __main__ - Step 11470: {'lr': 0.0004949669420287941, 'samples': 2202240, 'steps': 11469, 'loss/train': 1.595177412033081} +11/06/2021 22:50:11 - INFO - __main__ - Step 11471: {'lr': 0.0004949658824949277, 'samples': 2202432, 'steps': 11470, 'loss/train': 1.6120365858078003} +11/06/2021 22:50:12 - INFO - __main__ - Step 11472: {'lr': 0.0004949648228506834, 'samples': 2202624, 'steps': 11471, 'loss/train': 1.6954563856124878} +11/06/2021 22:50:12 - INFO - __main__ - Step 11473: {'lr': 0.0004949637630960618, 'samples': 2202816, 'steps': 11472, 'loss/train': 1.4135258197784424} +11/06/2021 22:50:13 - INFO - __main__ - Step 11474: {'lr': 0.0004949627032310632, 'samples': 2203008, 'steps': 11473, 'loss/train': 1.074235200881958} +11/06/2021 22:50:13 - INFO - __main__ - Step 11475: {'lr': 0.0004949616432556882, 'samples': 2203200, 'steps': 11474, 'loss/train': 2.001767635345459} +11/06/2021 22:50:14 - INFO - __main__ - Step 11476: {'lr': 0.0004949605831699373, 'samples': 2203392, 'steps': 11475, 'loss/train': 1.4366241693496704} +11/06/2021 22:50:14 - INFO - __main__ - Step 11477: {'lr': 0.000494959522973811, 'samples': 2203584, 'steps': 11476, 'loss/train': 1.5947993993759155} +11/06/2021 22:50:14 - INFO - __main__ - Step 11478: {'lr': 0.0004949584626673096, 'samples': 2203776, 'steps': 11477, 'loss/train': 1.586674451828003} +11/06/2021 22:50:15 - INFO - __main__ - Step 11479: {'lr': 0.0004949574022504338, 'samples': 2203968, 'steps': 11478, 'loss/train': 1.7831062078475952} +11/06/2021 22:50:16 - INFO - __main__ - Step 11480: {'lr': 0.0004949563417231838, 'samples': 2204160, 'steps': 11479, 'loss/train': 2.0792524814605713} +11/06/2021 22:50:16 - INFO - __main__ - Step 11481: {'lr': 0.0004949552810855605, 'samples': 2204352, 'steps': 11480, 'loss/train': 1.7512733936309814} +11/06/2021 22:50:16 - INFO - __main__ - Step 11482: {'lr': 0.000494954220337564, 'samples': 2204544, 'steps': 11481, 'loss/train': 1.9360369443893433} +11/06/2021 22:50:17 - INFO - __main__ - Step 11483: {'lr': 0.0004949531594791948, 'samples': 2204736, 'steps': 11482, 'loss/train': 0.5724799633026123} +11/06/2021 22:50:18 - INFO - __main__ - Step 11484: {'lr': 0.0004949520985104536, 'samples': 2204928, 'steps': 11483, 'loss/train': 1.9736790657043457} +11/06/2021 22:50:18 - INFO - __main__ - Step 11485: {'lr': 0.0004949510374313409, 'samples': 2205120, 'steps': 11484, 'loss/train': 1.3778972625732422} +11/06/2021 22:50:18 - INFO - __main__ - Step 11486: {'lr': 0.0004949499762418568, 'samples': 2205312, 'steps': 11485, 'loss/train': 1.658096194267273} +11/06/2021 22:50:19 - INFO - __main__ - Step 11487: {'lr': 0.0004949489149420021, 'samples': 2205504, 'steps': 11486, 'loss/train': 1.9003406763076782} +11/06/2021 22:50:19 - INFO - __main__ - Step 11488: {'lr': 0.0004949478535317773, 'samples': 2205696, 'steps': 11487, 'loss/train': 1.31734299659729} +11/06/2021 22:50:20 - INFO - __main__ - Step 11489: {'lr': 0.0004949467920111827, 'samples': 2205888, 'steps': 11488, 'loss/train': 2.2677342891693115} +11/06/2021 22:50:21 - INFO - __main__ - Step 11490: {'lr': 0.0004949457303802189, 'samples': 2206080, 'steps': 11489, 'loss/train': 1.4590067863464355} +11/06/2021 22:50:21 - INFO - __main__ - Step 11491: {'lr': 0.0004949446686388862, 'samples': 2206272, 'steps': 11490, 'loss/train': 1.8408727645874023} +11/06/2021 22:50:21 - INFO - __main__ - Step 11492: {'lr': 0.0004949436067871854, 'samples': 2206464, 'steps': 11491, 'loss/train': 2.519899845123291} +11/06/2021 22:50:22 - INFO - __main__ - Step 11493: {'lr': 0.0004949425448251166, 'samples': 2206656, 'steps': 11492, 'loss/train': 1.598381757736206} +11/06/2021 22:50:22 - INFO - __main__ - Step 11494: {'lr': 0.0004949414827526805, 'samples': 2206848, 'steps': 11493, 'loss/train': 1.779862642288208} +11/06/2021 22:50:23 - INFO - __main__ - Step 11495: {'lr': 0.0004949404205698777, 'samples': 2207040, 'steps': 11494, 'loss/train': 1.9242050647735596} +11/06/2021 22:50:23 - INFO - __main__ - Step 11496: {'lr': 0.0004949393582767084, 'samples': 2207232, 'steps': 11495, 'loss/train': 1.6788808107376099} +11/06/2021 22:50:24 - INFO - __main__ - Step 11497: {'lr': 0.0004949382958731733, 'samples': 2207424, 'steps': 11496, 'loss/train': 1.5965083837509155} +11/06/2021 22:50:24 - INFO - __main__ - Step 11498: {'lr': 0.0004949372333592728, 'samples': 2207616, 'steps': 11497, 'loss/train': 2.236138105392456} +11/06/2021 22:50:24 - INFO - __main__ - Step 11499: {'lr': 0.0004949361707350072, 'samples': 2207808, 'steps': 11498, 'loss/train': 1.7686853408813477} +11/06/2021 22:50:25 - INFO - __main__ - Step 11500: {'lr': 0.0004949351080003773, 'samples': 2208000, 'steps': 11499, 'loss/train': 1.9962258338928223} +11/06/2021 22:50:26 - INFO - __main__ - Step 11501: {'lr': 0.0004949340451553833, 'samples': 2208192, 'steps': 11500, 'loss/train': 1.7358423471450806} +11/06/2021 22:50:26 - INFO - __main__ - Step 11502: {'lr': 0.0004949329822000259, 'samples': 2208384, 'steps': 11501, 'loss/train': 1.7392240762710571} +11/06/2021 22:50:26 - INFO - __main__ - Step 11503: {'lr': 0.0004949319191343053, 'samples': 2208576, 'steps': 11502, 'loss/train': 2.329840660095215} +11/06/2021 22:50:27 - INFO - __main__ - Step 11504: {'lr': 0.0004949308559582224, 'samples': 2208768, 'steps': 11503, 'loss/train': 1.5851150751113892} +11/06/2021 22:50:28 - INFO - __main__ - Step 11505: {'lr': 0.0004949297926717772, 'samples': 2208960, 'steps': 11504, 'loss/train': 1.932198166847229} +11/06/2021 22:50:28 - INFO - __main__ - Step 11506: {'lr': 0.0004949287292749705, 'samples': 2209152, 'steps': 11505, 'loss/train': 1.7171591520309448} +11/06/2021 22:50:29 - INFO - __main__ - Step 11507: {'lr': 0.0004949276657678028, 'samples': 2209344, 'steps': 11506, 'loss/train': 2.190236806869507} +11/06/2021 22:50:29 - INFO - __main__ - Step 11508: {'lr': 0.0004949266021502744, 'samples': 2209536, 'steps': 11507, 'loss/train': 1.2840288877487183} +11/06/2021 22:50:29 - INFO - __main__ - Step 11509: {'lr': 0.0004949255384223859, 'samples': 2209728, 'steps': 11508, 'loss/train': 0.29179802536964417} +11/06/2021 22:50:30 - INFO - __main__ - Step 11510: {'lr': 0.0004949244745841377, 'samples': 2209920, 'steps': 11509, 'loss/train': 1.3277264833450317} +11/06/2021 22:50:31 - INFO - __main__ - Step 11511: {'lr': 0.0004949234106355302, 'samples': 2210112, 'steps': 11510, 'loss/train': 2.052576780319214} +11/06/2021 22:50:31 - INFO - __main__ - Step 11512: {'lr': 0.0004949223465765642, 'samples': 2210304, 'steps': 11511, 'loss/train': 1.9434692859649658} +11/06/2021 22:50:32 - INFO - __main__ - Step 11513: {'lr': 0.0004949212824072398, 'samples': 2210496, 'steps': 11512, 'loss/train': 2.3121955394744873} +11/06/2021 22:50:32 - INFO - __main__ - Step 11514: {'lr': 0.0004949202181275577, 'samples': 2210688, 'steps': 11513, 'loss/train': 1.9893686771392822} +11/06/2021 22:50:32 - INFO - __main__ - Step 11515: {'lr': 0.0004949191537375184, 'samples': 2210880, 'steps': 11514, 'loss/train': 1.3614085912704468} +11/06/2021 22:50:33 - INFO - __main__ - Step 11516: {'lr': 0.0004949180892371223, 'samples': 2211072, 'steps': 11515, 'loss/train': 1.9664455652236938} +11/06/2021 22:50:34 - INFO - __main__ - Step 11517: {'lr': 0.0004949170246263697, 'samples': 2211264, 'steps': 11516, 'loss/train': 2.041748046875} +11/06/2021 22:50:34 - INFO - __main__ - Step 11518: {'lr': 0.0004949159599052614, 'samples': 2211456, 'steps': 11517, 'loss/train': 1.993459939956665} +11/06/2021 22:50:34 - INFO - __main__ - Step 11519: {'lr': 0.0004949148950737978, 'samples': 2211648, 'steps': 11518, 'loss/train': 1.6282458305358887} +11/06/2021 22:50:35 - INFO - __main__ - Step 11520: {'lr': 0.0004949138301319793, 'samples': 2211840, 'steps': 11519, 'loss/train': 1.2587100267410278} +11/06/2021 22:50:35 - INFO - __main__ - Step 11521: {'lr': 0.0004949127650798063, 'samples': 2212032, 'steps': 11520, 'loss/train': 1.619840145111084} +11/06/2021 22:50:36 - INFO - __main__ - Step 11522: {'lr': 0.0004949116999172795, 'samples': 2212224, 'steps': 11521, 'loss/train': 1.572475790977478} +11/06/2021 22:50:36 - INFO - __main__ - Step 11523: {'lr': 0.0004949106346443992, 'samples': 2212416, 'steps': 11522, 'loss/train': 1.6941105127334595} +11/06/2021 22:50:37 - INFO - __main__ - Step 11524: {'lr': 0.0004949095692611661, 'samples': 2212608, 'steps': 11523, 'loss/train': 1.9662777185440063} +11/06/2021 22:50:37 - INFO - __main__ - Step 11525: {'lr': 0.0004949085037675803, 'samples': 2212800, 'steps': 11524, 'loss/train': 1.7247838973999023} +11/06/2021 22:50:37 - INFO - __main__ - Step 11526: {'lr': 0.0004949074381636427, 'samples': 2212992, 'steps': 11525, 'loss/train': 1.9012329578399658} +11/06/2021 22:50:38 - INFO - __main__ - Step 11527: {'lr': 0.0004949063724493534, 'samples': 2213184, 'steps': 11526, 'loss/train': 1.9752020835876465} +11/06/2021 22:50:39 - INFO - __main__ - Step 11528: {'lr': 0.0004949053066247133, 'samples': 2213376, 'steps': 11527, 'loss/train': 1.4446111917495728} +11/06/2021 22:50:39 - INFO - __main__ - Step 11529: {'lr': 0.0004949042406897225, 'samples': 2213568, 'steps': 11528, 'loss/train': 1.739598274230957} +11/06/2021 22:50:40 - INFO - __main__ - Step 11530: {'lr': 0.0004949031746443816, 'samples': 2213760, 'steps': 11529, 'loss/train': 1.8068318367004395} +11/06/2021 22:50:40 - INFO - __main__ - Step 11531: {'lr': 0.0004949021084886912, 'samples': 2213952, 'steps': 11530, 'loss/train': 1.7446298599243164} +11/06/2021 22:50:41 - INFO - __main__ - Step 11532: {'lr': 0.0004949010422226517, 'samples': 2214144, 'steps': 11531, 'loss/train': 1.2922008037567139} +11/06/2021 22:50:41 - INFO - __main__ - Step 11533: {'lr': 0.0004948999758462634, 'samples': 2214336, 'steps': 11532, 'loss/train': 2.062342882156372} +11/06/2021 22:50:42 - INFO - __main__ - Step 11534: {'lr': 0.000494898909359527, 'samples': 2214528, 'steps': 11533, 'loss/train': 1.4486849308013916} +11/06/2021 22:50:42 - INFO - __main__ - Step 11535: {'lr': 0.0004948978427624431, 'samples': 2214720, 'steps': 11534, 'loss/train': 1.7897515296936035} +11/06/2021 22:50:42 - INFO - __main__ - Step 11536: {'lr': 0.0004948967760550119, 'samples': 2214912, 'steps': 11535, 'loss/train': 1.818204402923584} +11/06/2021 22:50:43 - INFO - __main__ - Step 11537: {'lr': 0.000494895709237234, 'samples': 2215104, 'steps': 11536, 'loss/train': 1.166475534439087} +11/06/2021 22:50:44 - INFO - __main__ - Step 11538: {'lr': 0.0004948946423091099, 'samples': 2215296, 'steps': 11537, 'loss/train': 1.8267381191253662} +11/06/2021 22:50:44 - INFO - __main__ - Step 11539: {'lr': 0.0004948935752706401, 'samples': 2215488, 'steps': 11538, 'loss/train': 2.1393001079559326} +11/06/2021 22:50:44 - INFO - __main__ - Step 11540: {'lr': 0.0004948925081218248, 'samples': 2215680, 'steps': 11539, 'loss/train': 1.0833170413970947} +11/06/2021 22:50:45 - INFO - __main__ - Step 11541: {'lr': 0.000494891440862665, 'samples': 2215872, 'steps': 11540, 'loss/train': 1.8711026906967163} +11/06/2021 22:50:46 - INFO - __main__ - Step 11542: {'lr': 0.0004948903734931608, 'samples': 2216064, 'steps': 11541, 'loss/train': 1.5871480703353882} +11/06/2021 22:50:46 - INFO - __main__ - Step 11543: {'lr': 0.0004948893060133128, 'samples': 2216256, 'steps': 11542, 'loss/train': 1.5107953548431396} +11/06/2021 22:50:47 - INFO - __main__ - Step 11544: {'lr': 0.0004948882384231213, 'samples': 2216448, 'steps': 11543, 'loss/train': 1.1852807998657227} +11/06/2021 22:50:47 - INFO - __main__ - Step 11545: {'lr': 0.0004948871707225871, 'samples': 2216640, 'steps': 11544, 'loss/train': 1.8642654418945312} +11/06/2021 22:50:47 - INFO - __main__ - Step 11546: {'lr': 0.0004948861029117104, 'samples': 2216832, 'steps': 11545, 'loss/train': 1.524583339691162} +11/06/2021 22:50:48 - INFO - __main__ - Step 11547: {'lr': 0.0004948850349904919, 'samples': 2217024, 'steps': 11546, 'loss/train': 1.7309693098068237} +11/06/2021 22:50:49 - INFO - __main__ - Step 11548: {'lr': 0.0004948839669589319, 'samples': 2217216, 'steps': 11547, 'loss/train': 1.4048861265182495} +11/06/2021 22:50:49 - INFO - __main__ - Step 11549: {'lr': 0.000494882898817031, 'samples': 2217408, 'steps': 11548, 'loss/train': 1.8817989826202393} +11/06/2021 22:50:49 - INFO - __main__ - Step 11550: {'lr': 0.0004948818305647897, 'samples': 2217600, 'steps': 11549, 'loss/train': 1.4648607969284058} +11/06/2021 22:50:50 - INFO - __main__ - Step 11551: {'lr': 0.0004948807622022083, 'samples': 2217792, 'steps': 11550, 'loss/train': 2.3621954917907715} +11/06/2021 22:50:50 - INFO - __main__ - Step 11552: {'lr': 0.0004948796937292875, 'samples': 2217984, 'steps': 11551, 'loss/train': 1.87119722366333} +11/06/2021 22:50:51 - INFO - __main__ - Step 11553: {'lr': 0.0004948786251460277, 'samples': 2218176, 'steps': 11552, 'loss/train': 2.0248570442199707} +11/06/2021 22:50:51 - INFO - __main__ - Step 11554: {'lr': 0.0004948775564524294, 'samples': 2218368, 'steps': 11553, 'loss/train': 2.0253686904907227} +11/06/2021 22:50:52 - INFO - __main__ - Step 11555: {'lr': 0.000494876487648493, 'samples': 2218560, 'steps': 11554, 'loss/train': 1.359278917312622} +11/06/2021 22:50:52 - INFO - __main__ - Step 11556: {'lr': 0.0004948754187342189, 'samples': 2218752, 'steps': 11555, 'loss/train': 2.02559757232666} +11/06/2021 22:50:52 - INFO - __main__ - Step 11557: {'lr': 0.0004948743497096079, 'samples': 2218944, 'steps': 11556, 'loss/train': 1.019589900970459} +11/06/2021 22:50:54 - INFO - __main__ - Step 11558: {'lr': 0.0004948732805746604, 'samples': 2219136, 'steps': 11557, 'loss/train': 1.860040545463562} +11/06/2021 22:50:54 - INFO - __main__ - Step 11559: {'lr': 0.0004948722113293766, 'samples': 2219328, 'steps': 11558, 'loss/train': 1.786012053489685} +11/06/2021 22:50:54 - INFO - __main__ - Step 11560: {'lr': 0.000494871141973757, 'samples': 2219520, 'steps': 11559, 'loss/train': 1.9296960830688477} +11/06/2021 22:50:55 - INFO - __main__ - Step 11561: {'lr': 0.0004948700725078025, 'samples': 2219712, 'steps': 11560, 'loss/train': 1.883889079093933} +11/06/2021 22:50:55 - INFO - __main__ - Step 11562: {'lr': 0.0004948690029315133, 'samples': 2219904, 'steps': 11561, 'loss/train': 1.7466262578964233} +11/06/2021 22:50:56 - INFO - __main__ - Step 11563: {'lr': 0.0004948679332448899, 'samples': 2220096, 'steps': 11562, 'loss/train': 1.7426663637161255} +11/06/2021 22:50:57 - INFO - __main__ - Step 11564: {'lr': 0.0004948668634479327, 'samples': 2220288, 'steps': 11563, 'loss/train': 2.0808141231536865} +11/06/2021 22:50:57 - INFO - __main__ - Step 11565: {'lr': 0.0004948657935406423, 'samples': 2220480, 'steps': 11564, 'loss/train': 1.635694980621338} +11/06/2021 22:50:57 - INFO - __main__ - Step 11566: {'lr': 0.0004948647235230192, 'samples': 2220672, 'steps': 11565, 'loss/train': 1.6016157865524292} +11/06/2021 22:50:58 - INFO - __main__ - Step 11567: {'lr': 0.0004948636533950638, 'samples': 2220864, 'steps': 11566, 'loss/train': 1.8231465816497803} +11/06/2021 22:50:59 - INFO - __main__ - Step 11568: {'lr': 0.0004948625831567766, 'samples': 2221056, 'steps': 11567, 'loss/train': 1.6762038469314575} +11/06/2021 22:50:59 - INFO - __main__ - Step 11569: {'lr': 0.000494861512808158, 'samples': 2221248, 'steps': 11568, 'loss/train': 1.9984252452850342} +11/06/2021 22:50:59 - INFO - __main__ - Step 11570: {'lr': 0.0004948604423492088, 'samples': 2221440, 'steps': 11569, 'loss/train': 1.8539700508117676} +11/06/2021 22:51:00 - INFO - __main__ - Step 11571: {'lr': 0.0004948593717799292, 'samples': 2221632, 'steps': 11570, 'loss/train': 1.6391667127609253} +11/06/2021 22:51:00 - INFO - __main__ - Step 11572: {'lr': 0.0004948583011003196, 'samples': 2221824, 'steps': 11571, 'loss/train': 1.7608556747436523} +11/06/2021 22:51:00 - INFO - __main__ - Step 11573: {'lr': 0.0004948572303103808, 'samples': 2222016, 'steps': 11572, 'loss/train': 1.8692219257354736} +11/06/2021 22:51:01 - INFO - __main__ - Step 11574: {'lr': 0.0004948561594101129, 'samples': 2222208, 'steps': 11573, 'loss/train': 1.743513584136963} +11/06/2021 22:51:02 - INFO - __main__ - Step 11575: {'lr': 0.0004948550883995168, 'samples': 2222400, 'steps': 11574, 'loss/train': 1.3404990434646606} +11/06/2021 22:51:02 - INFO - __main__ - Step 11576: {'lr': 0.0004948540172785927, 'samples': 2222592, 'steps': 11575, 'loss/train': 1.5622731447219849} +11/06/2021 22:51:02 - INFO - __main__ - Step 11577: {'lr': 0.0004948529460473412, 'samples': 2222784, 'steps': 11576, 'loss/train': 1.3603805303573608} +11/06/2021 22:51:03 - INFO - __main__ - Step 11578: {'lr': 0.0004948518747057626, 'samples': 2222976, 'steps': 11577, 'loss/train': 1.4765523672103882} +11/06/2021 22:51:04 - INFO - __main__ - Step 11579: {'lr': 0.0004948508032538578, 'samples': 2223168, 'steps': 11578, 'loss/train': 1.918787956237793} +11/06/2021 22:51:04 - INFO - __main__ - Step 11580: {'lr': 0.0004948497316916267, 'samples': 2223360, 'steps': 11579, 'loss/train': 2.0067150592803955} +11/06/2021 22:51:04 - INFO - __main__ - Step 11581: {'lr': 0.0004948486600190702, 'samples': 2223552, 'steps': 11580, 'loss/train': 1.6319156885147095} +11/06/2021 22:51:05 - INFO - __main__ - Step 11582: {'lr': 0.0004948475882361888, 'samples': 2223744, 'steps': 11581, 'loss/train': 1.4225183725357056} +11/06/2021 22:51:05 - INFO - __main__ - Step 11583: {'lr': 0.0004948465163429828, 'samples': 2223936, 'steps': 11582, 'loss/train': 1.5520676374435425} +11/06/2021 22:51:06 - INFO - __main__ - Step 11584: {'lr': 0.0004948454443394527, 'samples': 2224128, 'steps': 11583, 'loss/train': 1.5501137971878052} +11/06/2021 22:51:07 - INFO - __main__ - Step 11585: {'lr': 0.000494844372225599, 'samples': 2224320, 'steps': 11584, 'loss/train': 1.650390625} +11/06/2021 22:51:07 - INFO - __main__ - Step 11586: {'lr': 0.0004948433000014222, 'samples': 2224512, 'steps': 11585, 'loss/train': 1.4051388502120972} +11/06/2021 22:51:07 - INFO - __main__ - Step 11587: {'lr': 0.0004948422276669228, 'samples': 2224704, 'steps': 11586, 'loss/train': 1.91586434841156} +11/06/2021 22:51:08 - INFO - __main__ - Step 11588: {'lr': 0.0004948411552221012, 'samples': 2224896, 'steps': 11587, 'loss/train': 2.1239876747131348} +11/06/2021 22:51:09 - INFO - __main__ - Step 11589: {'lr': 0.000494840082666958, 'samples': 2225088, 'steps': 11588, 'loss/train': 1.9688409566879272} +11/06/2021 22:51:09 - INFO - __main__ - Step 11590: {'lr': 0.0004948390100014937, 'samples': 2225280, 'steps': 11589, 'loss/train': 1.567671775817871} +11/06/2021 22:51:09 - INFO - __main__ - Step 11591: {'lr': 0.0004948379372257086, 'samples': 2225472, 'steps': 11590, 'loss/train': 1.2471174001693726} +11/06/2021 22:51:10 - INFO - __main__ - Step 11592: {'lr': 0.0004948368643396035, 'samples': 2225664, 'steps': 11591, 'loss/train': 1.732541799545288} +11/06/2021 22:51:10 - INFO - __main__ - Step 11593: {'lr': 0.0004948357913431786, 'samples': 2225856, 'steps': 11592, 'loss/train': 1.8311717510223389} +11/06/2021 22:51:11 - INFO - __main__ - Step 11594: {'lr': 0.0004948347182364344, 'samples': 2226048, 'steps': 11593, 'loss/train': 2.0419249534606934} +11/06/2021 22:51:11 - INFO - __main__ - Step 11595: {'lr': 0.0004948336450193715, 'samples': 2226240, 'steps': 11594, 'loss/train': 0.42051059007644653} +11/06/2021 22:51:12 - INFO - __main__ - Step 11596: {'lr': 0.0004948325716919904, 'samples': 2226432, 'steps': 11595, 'loss/train': 2.2684004306793213} +11/06/2021 22:51:12 - INFO - __main__ - Step 11597: {'lr': 0.0004948314982542914, 'samples': 2226624, 'steps': 11596, 'loss/train': 1.7309365272521973} +11/06/2021 22:51:13 - INFO - __main__ - Step 11598: {'lr': 0.0004948304247062752, 'samples': 2226816, 'steps': 11597, 'loss/train': 1.4194977283477783} +11/06/2021 22:51:14 - INFO - __main__ - Step 11599: {'lr': 0.0004948293510479421, 'samples': 2227008, 'steps': 11598, 'loss/train': 0.8019549250602722} +11/06/2021 22:51:14 - INFO - __main__ - Step 11600: {'lr': 0.0004948282772792927, 'samples': 2227200, 'steps': 11599, 'loss/train': 1.8629350662231445} +11/06/2021 22:51:14 - INFO - __main__ - Step 11601: {'lr': 0.0004948272034003275, 'samples': 2227392, 'steps': 11600, 'loss/train': 1.8861653804779053} +11/06/2021 22:51:15 - INFO - __main__ - Step 11602: {'lr': 0.000494826129411047, 'samples': 2227584, 'steps': 11601, 'loss/train': 1.1293734312057495} +11/06/2021 22:51:15 - INFO - __main__ - Step 11603: {'lr': 0.0004948250553114516, 'samples': 2227776, 'steps': 11602, 'loss/train': 1.6663720607757568} +11/06/2021 22:51:15 - INFO - __main__ - Step 11604: {'lr': 0.0004948239811015416, 'samples': 2227968, 'steps': 11603, 'loss/train': 1.6033754348754883} +11/06/2021 22:51:16 - INFO - __main__ - Step 11605: {'lr': 0.0004948229067813179, 'samples': 2228160, 'steps': 11604, 'loss/train': 1.3643414974212646} +11/06/2021 22:51:17 - INFO - __main__ - Step 11606: {'lr': 0.0004948218323507807, 'samples': 2228352, 'steps': 11605, 'loss/train': 2.118734836578369} +11/06/2021 22:51:17 - INFO - __main__ - Step 11607: {'lr': 0.0004948207578099306, 'samples': 2228544, 'steps': 11606, 'loss/train': 1.5554416179656982} +11/06/2021 22:51:17 - INFO - __main__ - Step 11608: {'lr': 0.000494819683158768, 'samples': 2228736, 'steps': 11607, 'loss/train': 1.433336615562439} +11/06/2021 22:51:18 - INFO - __main__ - Step 11609: {'lr': 0.0004948186083972934, 'samples': 2228928, 'steps': 11608, 'loss/train': 1.552068829536438} +11/06/2021 22:51:19 - INFO - __main__ - Step 11610: {'lr': 0.0004948175335255075, 'samples': 2229120, 'steps': 11609, 'loss/train': 1.240715503692627} +11/06/2021 22:51:19 - INFO - __main__ - Step 11611: {'lr': 0.0004948164585434104, 'samples': 2229312, 'steps': 11610, 'loss/train': 1.7166132926940918} +11/06/2021 22:51:20 - INFO - __main__ - Step 11612: {'lr': 0.0004948153834510028, 'samples': 2229504, 'steps': 11611, 'loss/train': 1.7382307052612305} +11/06/2021 22:51:20 - INFO - __main__ - Step 11613: {'lr': 0.0004948143082482852, 'samples': 2229696, 'steps': 11612, 'loss/train': 1.9601466655731201} +11/06/2021 22:51:20 - INFO - __main__ - Step 11614: {'lr': 0.0004948132329352582, 'samples': 2229888, 'steps': 11613, 'loss/train': 1.7500718832015991} +11/06/2021 22:51:21 - INFO - __main__ - Step 11615: {'lr': 0.0004948121575119219, 'samples': 2230080, 'steps': 11614, 'loss/train': 5.872844696044922} +11/06/2021 22:51:22 - INFO - __main__ - Step 11616: {'lr': 0.0004948110819782771, 'samples': 2230272, 'steps': 11615, 'loss/train': 1.6911870241165161} +11/06/2021 22:51:22 - INFO - __main__ - Step 11617: {'lr': 0.0004948100063343243, 'samples': 2230464, 'steps': 11616, 'loss/train': 1.594088077545166} +11/06/2021 22:51:22 - INFO - __main__ - Step 11618: {'lr': 0.0004948089305800638, 'samples': 2230656, 'steps': 11617, 'loss/train': 1.9734327793121338} +11/06/2021 22:51:23 - INFO - __main__ - Step 11619: {'lr': 0.0004948078547154962, 'samples': 2230848, 'steps': 11618, 'loss/train': 1.6274333000183105} +11/06/2021 22:51:24 - INFO - __main__ - Step 11620: {'lr': 0.0004948067787406219, 'samples': 2231040, 'steps': 11619, 'loss/train': 2.051081418991089} +11/06/2021 22:51:24 - INFO - __main__ - Step 11621: {'lr': 0.0004948057026554415, 'samples': 2231232, 'steps': 11620, 'loss/train': 1.4982271194458008} +11/06/2021 22:51:24 - INFO - __main__ - Step 11622: {'lr': 0.0004948046264599554, 'samples': 2231424, 'steps': 11621, 'loss/train': 1.4409050941467285} +11/06/2021 22:51:25 - INFO - __main__ - Step 11623: {'lr': 0.0004948035501541641, 'samples': 2231616, 'steps': 11622, 'loss/train': 2.061194658279419} +11/06/2021 22:51:25 - INFO - __main__ - Step 11624: {'lr': 0.0004948024737380681, 'samples': 2231808, 'steps': 11623, 'loss/train': 1.7897642850875854} +11/06/2021 22:51:26 - INFO - __main__ - Step 11625: {'lr': 0.000494801397211668, 'samples': 2232000, 'steps': 11624, 'loss/train': 1.5584590435028076} +11/06/2021 22:51:27 - INFO - __main__ - Step 11626: {'lr': 0.000494800320574964, 'samples': 2232192, 'steps': 11625, 'loss/train': 1.4107680320739746} +11/06/2021 22:51:27 - INFO - __main__ - Step 11627: {'lr': 0.0004947992438279568, 'samples': 2232384, 'steps': 11626, 'loss/train': 1.7100175619125366} +11/06/2021 22:51:27 - INFO - __main__ - Step 11628: {'lr': 0.0004947981669706469, 'samples': 2232576, 'steps': 11627, 'loss/train': 1.3465707302093506} +11/06/2021 22:51:28 - INFO - __main__ - Step 11629: {'lr': 0.0004947970900030346, 'samples': 2232768, 'steps': 11628, 'loss/train': 1.6569414138793945} +11/06/2021 22:51:28 - INFO - __main__ - Step 11630: {'lr': 0.0004947960129251206, 'samples': 2232960, 'steps': 11629, 'loss/train': 1.8013361692428589} +11/06/2021 22:51:29 - INFO - __main__ - Step 11631: {'lr': 0.0004947949357369054, 'samples': 2233152, 'steps': 11630, 'loss/train': 1.4865167140960693} +11/06/2021 22:51:29 - INFO - __main__ - Step 11632: {'lr': 0.0004947938584383892, 'samples': 2233344, 'steps': 11631, 'loss/train': 2.1401309967041016} +11/06/2021 22:51:30 - INFO - __main__ - Step 11633: {'lr': 0.0004947927810295728, 'samples': 2233536, 'steps': 11632, 'loss/train': 1.6527354717254639} +11/06/2021 22:51:30 - INFO - __main__ - Step 11634: {'lr': 0.0004947917035104564, 'samples': 2233728, 'steps': 11633, 'loss/train': 1.9105935096740723} +11/06/2021 22:51:30 - INFO - __main__ - Step 11635: {'lr': 0.0004947906258810407, 'samples': 2233920, 'steps': 11634, 'loss/train': 1.906631350517273} +11/06/2021 22:51:31 - INFO - __main__ - Step 11636: {'lr': 0.0004947895481413262, 'samples': 2234112, 'steps': 11635, 'loss/train': 2.1798081398010254} +11/06/2021 22:51:32 - INFO - __main__ - Step 11637: {'lr': 0.0004947884702913133, 'samples': 2234304, 'steps': 11636, 'loss/train': 1.9816797971725464} +11/06/2021 22:51:32 - INFO - __main__ - Step 11638: {'lr': 0.0004947873923310024, 'samples': 2234496, 'steps': 11637, 'loss/train': 1.7533513307571411} +11/06/2021 22:51:32 - INFO - __main__ - Step 11639: {'lr': 0.0004947863142603941, 'samples': 2234688, 'steps': 11638, 'loss/train': 1.5233229398727417} +11/06/2021 22:51:33 - INFO - __main__ - Step 11640: {'lr': 0.0004947852360794889, 'samples': 2234880, 'steps': 11639, 'loss/train': 1.628521203994751} +11/06/2021 22:51:34 - INFO - __main__ - Step 11641: {'lr': 0.0004947841577882873, 'samples': 2235072, 'steps': 11640, 'loss/train': 1.8481824398040771} +11/06/2021 22:51:34 - INFO - __main__ - Step 11642: {'lr': 0.0004947830793867896, 'samples': 2235264, 'steps': 11641, 'loss/train': 2.2054293155670166} +11/06/2021 22:51:34 - INFO - __main__ - Step 11643: {'lr': 0.0004947820008749965, 'samples': 2235456, 'steps': 11642, 'loss/train': 1.8366459608078003} +11/06/2021 22:51:35 - INFO - __main__ - Step 11644: {'lr': 0.0004947809222529084, 'samples': 2235648, 'steps': 11643, 'loss/train': 1.237697720527649} +11/06/2021 22:51:35 - INFO - __main__ - Step 11645: {'lr': 0.0004947798435205258, 'samples': 2235840, 'steps': 11644, 'loss/train': 1.8298448324203491} +11/06/2021 22:51:36 - INFO - __main__ - Step 11646: {'lr': 0.0004947787646778491, 'samples': 2236032, 'steps': 11645, 'loss/train': 1.7138854265213013} +11/06/2021 22:51:36 - INFO - __main__ - Step 11647: {'lr': 0.0004947776857248791, 'samples': 2236224, 'steps': 11646, 'loss/train': 1.7913033962249756} +11/06/2021 22:51:37 - INFO - __main__ - Step 11648: {'lr': 0.0004947766066616157, 'samples': 2236416, 'steps': 11647, 'loss/train': 1.7357981204986572} +11/06/2021 22:51:37 - INFO - __main__ - Step 11649: {'lr': 0.00049477552748806, 'samples': 2236608, 'steps': 11648, 'loss/train': 1.6491725444793701} +11/06/2021 22:51:38 - INFO - __main__ - Step 11650: {'lr': 0.0004947744482042122, 'samples': 2236800, 'steps': 11649, 'loss/train': 1.3429278135299683} +11/06/2021 22:51:38 - INFO - __main__ - Step 11651: {'lr': 0.0004947733688100728, 'samples': 2236992, 'steps': 11650, 'loss/train': 1.4097791910171509} +11/06/2021 22:51:39 - INFO - __main__ - Step 11652: {'lr': 0.0004947722893056423, 'samples': 2237184, 'steps': 11651, 'loss/train': 1.9435794353485107} +11/06/2021 22:51:39 - INFO - __main__ - Step 11653: {'lr': 0.0004947712096909211, 'samples': 2237376, 'steps': 11652, 'loss/train': 1.272664189338684} +11/06/2021 22:51:40 - INFO - __main__ - Step 11654: {'lr': 0.0004947701299659097, 'samples': 2237568, 'steps': 11653, 'loss/train': 1.6220483779907227} +11/06/2021 22:51:40 - INFO - __main__ - Step 11655: {'lr': 0.0004947690501306088, 'samples': 2237760, 'steps': 11654, 'loss/train': 2.2113709449768066} +11/06/2021 22:51:40 - INFO - __main__ - Step 11656: {'lr': 0.0004947679701850187, 'samples': 2237952, 'steps': 11655, 'loss/train': 1.6100585460662842} +11/06/2021 22:51:41 - INFO - __main__ - Step 11657: {'lr': 0.00049476689012914, 'samples': 2238144, 'steps': 11656, 'loss/train': 1.5602444410324097} +11/06/2021 22:51:42 - INFO - __main__ - Step 11658: {'lr': 0.0004947658099629731, 'samples': 2238336, 'steps': 11657, 'loss/train': 1.4081251621246338} +11/06/2021 22:51:42 - INFO - __main__ - Step 11659: {'lr': 0.0004947647296865184, 'samples': 2238528, 'steps': 11658, 'loss/train': 1.445473074913025} +11/06/2021 22:51:42 - INFO - __main__ - Step 11660: {'lr': 0.0004947636492997765, 'samples': 2238720, 'steps': 11659, 'loss/train': 1.6339030265808105} +11/06/2021 22:51:43 - INFO - __main__ - Step 11661: {'lr': 0.0004947625688027479, 'samples': 2238912, 'steps': 11660, 'loss/train': 1.8317729234695435} +11/06/2021 22:51:44 - INFO - __main__ - Step 11662: {'lr': 0.0004947614881954332, 'samples': 2239104, 'steps': 11661, 'loss/train': 1.262568712234497} +11/06/2021 22:51:44 - INFO - __main__ - Step 11663: {'lr': 0.0004947604074778325, 'samples': 2239296, 'steps': 11662, 'loss/train': 1.5094019174575806} +11/06/2021 22:51:45 - INFO - __main__ - Step 11664: {'lr': 0.0004947593266499468, 'samples': 2239488, 'steps': 11663, 'loss/train': 1.4688637256622314} +11/06/2021 22:51:45 - INFO - __main__ - Step 11665: {'lr': 0.0004947582457117762, 'samples': 2239680, 'steps': 11664, 'loss/train': 2.3043243885040283} +11/06/2021 22:51:45 - INFO - __main__ - Step 11666: {'lr': 0.0004947571646633214, 'samples': 2239872, 'steps': 11665, 'loss/train': 1.4841505289077759} +11/06/2021 22:51:46 - INFO - __main__ - Step 11667: {'lr': 0.0004947560835045826, 'samples': 2240064, 'steps': 11666, 'loss/train': 1.7168904542922974} +11/06/2021 22:51:47 - INFO - __main__ - Step 11668: {'lr': 0.0004947550022355606, 'samples': 2240256, 'steps': 11667, 'loss/train': 1.6431477069854736} +11/06/2021 22:51:47 - INFO - __main__ - Step 11669: {'lr': 0.0004947539208562558, 'samples': 2240448, 'steps': 11668, 'loss/train': 0.3917955160140991} +11/06/2021 22:51:47 - INFO - __main__ - Step 11670: {'lr': 0.0004947528393666686, 'samples': 2240640, 'steps': 11669, 'loss/train': 1.4626667499542236} +11/06/2021 22:51:48 - INFO - __main__ - Step 11671: {'lr': 0.0004947517577667996, 'samples': 2240832, 'steps': 11670, 'loss/train': 1.9244534969329834} +11/06/2021 22:51:48 - INFO - __main__ - Step 11672: {'lr': 0.0004947506760566492, 'samples': 2241024, 'steps': 11671, 'loss/train': 1.6915565729141235} +11/06/2021 22:51:49 - INFO - __main__ - Step 11673: {'lr': 0.0004947495942362179, 'samples': 2241216, 'steps': 11672, 'loss/train': 1.8372933864593506} +11/06/2021 22:51:49 - INFO - __main__ - Step 11674: {'lr': 0.0004947485123055063, 'samples': 2241408, 'steps': 11673, 'loss/train': 1.7340296506881714} +11/06/2021 22:51:50 - INFO - __main__ - Step 11675: {'lr': 0.0004947474302645147, 'samples': 2241600, 'steps': 11674, 'loss/train': 2.306028127670288} +11/06/2021 22:51:50 - INFO - __main__ - Step 11676: {'lr': 0.0004947463481132438, 'samples': 2241792, 'steps': 11675, 'loss/train': 1.5373907089233398} +11/06/2021 22:51:50 - INFO - __main__ - Step 11677: {'lr': 0.0004947452658516938, 'samples': 2241984, 'steps': 11676, 'loss/train': 1.0355230569839478} +11/06/2021 22:51:52 - INFO - __main__ - Step 11678: {'lr': 0.0004947441834798655, 'samples': 2242176, 'steps': 11677, 'loss/train': 1.9624687433242798} +11/06/2021 22:51:52 - INFO - __main__ - Step 11679: {'lr': 0.0004947431009977592, 'samples': 2242368, 'steps': 11678, 'loss/train': 2.2089884281158447} +11/06/2021 22:51:52 - INFO - __main__ - Step 11680: {'lr': 0.0004947420184053755, 'samples': 2242560, 'steps': 11679, 'loss/train': 1.4249625205993652} +11/06/2021 22:51:53 - INFO - __main__ - Step 11681: {'lr': 0.0004947409357027148, 'samples': 2242752, 'steps': 11680, 'loss/train': 1.3146612644195557} +11/06/2021 22:51:53 - INFO - __main__ - Step 11682: {'lr': 0.0004947398528897775, 'samples': 2242944, 'steps': 11681, 'loss/train': 1.6115343570709229} +11/06/2021 22:51:53 - INFO - __main__ - Step 11683: {'lr': 0.0004947387699665643, 'samples': 2243136, 'steps': 11682, 'loss/train': 2.1556644439697266} +11/06/2021 22:51:54 - INFO - __main__ - Step 11684: {'lr': 0.0004947376869330755, 'samples': 2243328, 'steps': 11683, 'loss/train': 2.4655892848968506} +11/06/2021 22:51:55 - INFO - __main__ - Step 11685: {'lr': 0.0004947366037893118, 'samples': 2243520, 'steps': 11684, 'loss/train': 1.4725700616836548} +11/06/2021 22:51:55 - INFO - __main__ - Step 11686: {'lr': 0.0004947355205352735, 'samples': 2243712, 'steps': 11685, 'loss/train': 1.7428011894226074} +11/06/2021 22:51:55 - INFO - __main__ - Step 11687: {'lr': 0.0004947344371709611, 'samples': 2243904, 'steps': 11686, 'loss/train': 1.42606520652771} +11/06/2021 22:51:56 - INFO - __main__ - Step 11688: {'lr': 0.0004947333536963753, 'samples': 2244096, 'steps': 11687, 'loss/train': 1.7653391361236572} +11/06/2021 22:51:57 - INFO - __main__ - Step 11689: {'lr': 0.0004947322701115163, 'samples': 2244288, 'steps': 11688, 'loss/train': 2.0010745525360107} +11/06/2021 22:51:57 - INFO - __main__ - Step 11690: {'lr': 0.0004947311864163847, 'samples': 2244480, 'steps': 11689, 'loss/train': 1.4831074476242065} +11/06/2021 22:51:58 - INFO - __main__ - Step 11691: {'lr': 0.000494730102610981, 'samples': 2244672, 'steps': 11690, 'loss/train': 1.9865690469741821} +11/06/2021 22:51:58 - INFO - __main__ - Step 11692: {'lr': 0.0004947290186953057, 'samples': 2244864, 'steps': 11691, 'loss/train': 1.3742139339447021} +11/06/2021 22:51:58 - INFO - __main__ - Step 11693: {'lr': 0.0004947279346693594, 'samples': 2245056, 'steps': 11692, 'loss/train': 1.701667308807373} +11/06/2021 22:51:59 - INFO - __main__ - Step 11694: {'lr': 0.0004947268505331424, 'samples': 2245248, 'steps': 11693, 'loss/train': 1.9292877912521362} +11/06/2021 22:52:00 - INFO - __main__ - Step 11695: {'lr': 0.0004947257662866551, 'samples': 2245440, 'steps': 11694, 'loss/train': 2.0025382041931152} +11/06/2021 22:52:00 - INFO - __main__ - Step 11696: {'lr': 0.0004947246819298984, 'samples': 2245632, 'steps': 11695, 'loss/train': 1.10530424118042} +11/06/2021 22:52:00 - INFO - __main__ - Step 11697: {'lr': 0.0004947235974628723, 'samples': 2245824, 'steps': 11696, 'loss/train': 1.703428864479065} +11/06/2021 22:52:01 - INFO - __main__ - Step 11698: {'lr': 0.0004947225128855777, 'samples': 2246016, 'steps': 11697, 'loss/train': 1.4115582704544067} +11/06/2021 22:52:02 - INFO - __main__ - Step 11699: {'lr': 0.0004947214281980149, 'samples': 2246208, 'steps': 11698, 'loss/train': 1.6013803482055664} +11/06/2021 22:52:02 - INFO - __main__ - Step 11700: {'lr': 0.0004947203434001843, 'samples': 2246400, 'steps': 11699, 'loss/train': 0.8683410882949829} +11/06/2021 22:52:02 - INFO - __main__ - Step 11701: {'lr': 0.0004947192584920866, 'samples': 2246592, 'steps': 11700, 'loss/train': 1.931963324546814} +11/06/2021 22:52:03 - INFO - __main__ - Step 11702: {'lr': 0.000494718173473722, 'samples': 2246784, 'steps': 11701, 'loss/train': 1.411441683769226} +11/06/2021 22:52:03 - INFO - __main__ - Step 11703: {'lr': 0.0004947170883450913, 'samples': 2246976, 'steps': 11702, 'loss/train': 1.5308102369308472} +11/06/2021 22:52:04 - INFO - __main__ - Step 11704: {'lr': 0.000494716003106195, 'samples': 2247168, 'steps': 11703, 'loss/train': 2.047659158706665} +11/06/2021 22:52:05 - INFO - __main__ - Step 11705: {'lr': 0.0004947149177570332, 'samples': 2247360, 'steps': 11704, 'loss/train': 1.6442228555679321} +11/06/2021 22:52:05 - INFO - __main__ - Step 11706: {'lr': 0.0004947138322976067, 'samples': 2247552, 'steps': 11705, 'loss/train': 1.791576623916626} +11/06/2021 22:52:05 - INFO - __main__ - Step 11707: {'lr': 0.000494712746727916, 'samples': 2247744, 'steps': 11706, 'loss/train': 1.8355753421783447} +11/06/2021 22:52:06 - INFO - __main__ - Step 11708: {'lr': 0.0004947116610479614, 'samples': 2247936, 'steps': 11707, 'loss/train': 1.7016065120697021} +11/06/2021 22:52:06 - INFO - __main__ - Step 11709: {'lr': 0.0004947105752577436, 'samples': 2248128, 'steps': 11708, 'loss/train': 1.3050994873046875} +11/06/2021 22:52:07 - INFO - __main__ - Step 11710: {'lr': 0.0004947094893572629, 'samples': 2248320, 'steps': 11709, 'loss/train': 1.8479158878326416} +11/06/2021 22:52:08 - INFO - __main__ - Step 11711: {'lr': 0.00049470840334652, 'samples': 2248512, 'steps': 11710, 'loss/train': 1.892972707748413} +11/06/2021 22:52:08 - INFO - __main__ - Step 11712: {'lr': 0.0004947073172255151, 'samples': 2248704, 'steps': 11711, 'loss/train': 2.1024181842803955} +11/06/2021 22:52:08 - INFO - __main__ - Step 11713: {'lr': 0.000494706230994249, 'samples': 2248896, 'steps': 11712, 'loss/train': 1.7337501049041748} +11/06/2021 22:52:09 - INFO - __main__ - Step 11714: {'lr': 0.000494705144652722, 'samples': 2249088, 'steps': 11713, 'loss/train': 2.053222894668579} +11/06/2021 22:52:10 - INFO - __main__ - Step 11715: {'lr': 0.0004947040582009346, 'samples': 2249280, 'steps': 11714, 'loss/train': 1.5705617666244507} +11/06/2021 22:52:10 - INFO - __main__ - Step 11716: {'lr': 0.0004947029716388875, 'samples': 2249472, 'steps': 11715, 'loss/train': 1.1817337274551392} +11/06/2021 22:52:11 - INFO - __main__ - Step 11717: {'lr': 0.0004947018849665809, 'samples': 2249664, 'steps': 11716, 'loss/train': 1.7236446142196655} +11/06/2021 22:52:11 - INFO - __main__ - Step 11718: {'lr': 0.0004947007981840153, 'samples': 2249856, 'steps': 11717, 'loss/train': 1.561780571937561} +11/06/2021 22:52:11 - INFO - __main__ - Step 11719: {'lr': 0.0004946997112911914, 'samples': 2250048, 'steps': 11718, 'loss/train': 1.9812180995941162} +11/06/2021 22:52:12 - INFO - __main__ - Step 11720: {'lr': 0.0004946986242881096, 'samples': 2250240, 'steps': 11719, 'loss/train': 2.1320106983184814} +11/06/2021 22:52:13 - INFO - __main__ - Step 11721: {'lr': 0.0004946975371747704, 'samples': 2250432, 'steps': 11720, 'loss/train': 2.156588315963745} +11/06/2021 22:52:13 - INFO - __main__ - Step 11722: {'lr': 0.0004946964499511742, 'samples': 2250624, 'steps': 11721, 'loss/train': 1.9945005178451538} +11/06/2021 22:52:13 - INFO - __main__ - Step 11723: {'lr': 0.0004946953626173216, 'samples': 2250816, 'steps': 11722, 'loss/train': 1.00374174118042} +11/06/2021 22:52:14 - INFO - __main__ - Step 11724: {'lr': 0.0004946942751732129, 'samples': 2251008, 'steps': 11723, 'loss/train': 1.2549642324447632} +11/06/2021 22:52:14 - INFO - __main__ - Step 11725: {'lr': 0.000494693187618849, 'samples': 2251200, 'steps': 11724, 'loss/train': 1.6982334852218628} +11/06/2021 22:52:15 - INFO - __main__ - Step 11726: {'lr': 0.0004946920999542299, 'samples': 2251392, 'steps': 11725, 'loss/train': 5.76206636428833} +11/06/2021 22:52:15 - INFO - __main__ - Step 11727: {'lr': 0.0004946910121793564, 'samples': 2251584, 'steps': 11726, 'loss/train': 1.8769844770431519} +11/06/2021 22:52:16 - INFO - __main__ - Step 11728: {'lr': 0.0004946899242942289, 'samples': 2251776, 'steps': 11727, 'loss/train': 1.1642225980758667} +11/06/2021 22:52:16 - INFO - __main__ - Step 11729: {'lr': 0.000494688836298848, 'samples': 2251968, 'steps': 11728, 'loss/train': 1.9926396608352661} +11/06/2021 22:52:16 - INFO - __main__ - Step 11730: {'lr': 0.0004946877481932139, 'samples': 2252160, 'steps': 11729, 'loss/train': 1.9353605508804321} +11/06/2021 22:52:17 - INFO - __main__ - Step 11731: {'lr': 0.0004946866599773274, 'samples': 2252352, 'steps': 11730, 'loss/train': 1.884238839149475} +11/06/2021 22:52:18 - INFO - __main__ - Step 11732: {'lr': 0.0004946855716511888, 'samples': 2252544, 'steps': 11731, 'loss/train': 2.3865725994110107} +11/06/2021 22:52:18 - INFO - __main__ - Step 11733: {'lr': 0.0004946844832147987, 'samples': 2252736, 'steps': 11732, 'loss/train': 1.7648876905441284} +11/06/2021 22:52:18 - INFO - __main__ - Step 11734: {'lr': 0.0004946833946681575, 'samples': 2252928, 'steps': 11733, 'loss/train': 1.9588221311569214} +11/06/2021 22:52:19 - INFO - __main__ - Step 11735: {'lr': 0.0004946823060112658, 'samples': 2253120, 'steps': 11734, 'loss/train': 1.0032458305358887} +11/06/2021 22:52:20 - INFO - __main__ - Step 11736: {'lr': 0.000494681217244124, 'samples': 2253312, 'steps': 11735, 'loss/train': 1.9610958099365234} +11/06/2021 22:52:20 - INFO - __main__ - Step 11737: {'lr': 0.0004946801283667326, 'samples': 2253504, 'steps': 11736, 'loss/train': 1.6213114261627197} +11/06/2021 22:52:21 - INFO - __main__ - Step 11738: {'lr': 0.0004946790393790921, 'samples': 2253696, 'steps': 11737, 'loss/train': 1.8059797286987305} +11/06/2021 22:52:21 - INFO - __main__ - Step 11739: {'lr': 0.0004946779502812031, 'samples': 2253888, 'steps': 11738, 'loss/train': 2.2257320880889893} +11/06/2021 22:52:21 - INFO - __main__ - Step 11740: {'lr': 0.0004946768610730659, 'samples': 2254080, 'steps': 11739, 'loss/train': 1.6921347379684448} +11/06/2021 22:52:22 - INFO - __main__ - Step 11741: {'lr': 0.0004946757717546812, 'samples': 2254272, 'steps': 11740, 'loss/train': 1.7304112911224365} +11/06/2021 22:52:23 - INFO - __main__ - Step 11742: {'lr': 0.0004946746823260491, 'samples': 2254464, 'steps': 11741, 'loss/train': 0.8344317078590393} +11/06/2021 22:52:23 - INFO - __main__ - Step 11743: {'lr': 0.0004946735927871706, 'samples': 2254656, 'steps': 11742, 'loss/train': 1.438720941543579} +11/06/2021 22:52:23 - INFO - __main__ - Step 11744: {'lr': 0.0004946725031380459, 'samples': 2254848, 'steps': 11743, 'loss/train': 2.020857572555542} +11/06/2021 22:52:24 - INFO - __main__ - Step 11745: {'lr': 0.0004946714133786756, 'samples': 2255040, 'steps': 11744, 'loss/train': 1.5829726457595825} +11/06/2021 22:52:24 - INFO - __main__ - Step 11746: {'lr': 0.00049467032350906, 'samples': 2255232, 'steps': 11745, 'loss/train': 1.7040636539459229} +11/06/2021 22:52:25 - INFO - __main__ - Step 11747: {'lr': 0.0004946692335291999, 'samples': 2255424, 'steps': 11746, 'loss/train': 1.7753183841705322} +11/06/2021 22:52:26 - INFO - __main__ - Step 11748: {'lr': 0.0004946681434390955, 'samples': 2255616, 'steps': 11747, 'loss/train': 2.8313393592834473} +11/06/2021 22:52:26 - INFO - __main__ - Step 11749: {'lr': 0.0004946670532387474, 'samples': 2255808, 'steps': 11748, 'loss/train': 1.4932595491409302} +11/06/2021 22:52:26 - INFO - __main__ - Step 11750: {'lr': 0.0004946659629281561, 'samples': 2256000, 'steps': 11749, 'loss/train': 1.6414493322372437} +11/06/2021 22:52:27 - INFO - __main__ - Step 11751: {'lr': 0.0004946648725073222, 'samples': 2256192, 'steps': 11750, 'loss/train': 1.8771973848342896} +11/06/2021 22:52:27 - INFO - __main__ - Step 11752: {'lr': 0.0004946637819762459, 'samples': 2256384, 'steps': 11751, 'loss/train': 1.819173812866211} +11/06/2021 22:52:28 - INFO - __main__ - Step 11753: {'lr': 0.000494662691334928, 'samples': 2256576, 'steps': 11752, 'loss/train': 1.7248607873916626} +11/06/2021 22:52:29 - INFO - __main__ - Step 11754: {'lr': 0.0004946616005833689, 'samples': 2256768, 'steps': 11753, 'loss/train': 1.390769362449646} +11/06/2021 22:52:29 - INFO - __main__ - Step 11755: {'lr': 0.0004946605097215691, 'samples': 2256960, 'steps': 11754, 'loss/train': 1.4197173118591309} +11/06/2021 22:52:29 - INFO - __main__ - Step 11756: {'lr': 0.0004946594187495289, 'samples': 2257152, 'steps': 11755, 'loss/train': 1.846717357635498} +11/06/2021 22:52:30 - INFO - __main__ - Step 11757: {'lr': 0.0004946583276672489, 'samples': 2257344, 'steps': 11756, 'loss/train': 1.6870449781417847} +11/06/2021 22:52:31 - INFO - __main__ - Step 11758: {'lr': 0.0004946572364747298, 'samples': 2257536, 'steps': 11757, 'loss/train': 1.6424260139465332} +11/06/2021 22:52:31 - INFO - __main__ - Step 11759: {'lr': 0.0004946561451719719, 'samples': 2257728, 'steps': 11758, 'loss/train': 1.8925001621246338} +11/06/2021 22:52:32 - INFO - __main__ - Step 11760: {'lr': 0.0004946550537589757, 'samples': 2257920, 'steps': 11759, 'loss/train': 1.6655386686325073} +11/06/2021 22:52:32 - INFO - __main__ - Step 11761: {'lr': 0.0004946539622357417, 'samples': 2258112, 'steps': 11760, 'loss/train': 1.9449368715286255} +11/06/2021 22:52:32 - INFO - __main__ - Step 11762: {'lr': 0.0004946528706022703, 'samples': 2258304, 'steps': 11761, 'loss/train': 2.078275442123413} +11/06/2021 22:52:33 - INFO - __main__ - Step 11763: {'lr': 0.0004946517788585622, 'samples': 2258496, 'steps': 11762, 'loss/train': 1.4620633125305176} +11/06/2021 22:52:34 - INFO - __main__ - Step 11764: {'lr': 0.0004946506870046178, 'samples': 2258688, 'steps': 11763, 'loss/train': 1.66291344165802} +11/06/2021 22:52:34 - INFO - __main__ - Step 11765: {'lr': 0.0004946495950404375, 'samples': 2258880, 'steps': 11764, 'loss/train': 1.7311233282089233} +11/06/2021 22:52:34 - INFO - __main__ - Step 11766: {'lr': 0.0004946485029660219, 'samples': 2259072, 'steps': 11765, 'loss/train': 1.9496246576309204} +11/06/2021 22:52:35 - INFO - __main__ - Step 11767: {'lr': 0.0004946474107813715, 'samples': 2259264, 'steps': 11766, 'loss/train': 1.842336654663086} +11/06/2021 22:52:35 - INFO - __main__ - Step 11768: {'lr': 0.0004946463184864867, 'samples': 2259456, 'steps': 11767, 'loss/train': 1.8693801164627075} +11/06/2021 22:52:36 - INFO - __main__ - Step 11769: {'lr': 0.000494645226081368, 'samples': 2259648, 'steps': 11768, 'loss/train': 1.6797724962234497} +11/06/2021 22:52:36 - INFO - __main__ - Step 11770: {'lr': 0.000494644133566016, 'samples': 2259840, 'steps': 11769, 'loss/train': 1.4810084104537964} +11/06/2021 22:52:37 - INFO - __main__ - Step 11771: {'lr': 0.0004946430409404311, 'samples': 2260032, 'steps': 11770, 'loss/train': 1.5809372663497925} +11/06/2021 22:52:37 - INFO - __main__ - Step 11772: {'lr': 0.0004946419482046139, 'samples': 2260224, 'steps': 11771, 'loss/train': 1.3877747058868408} +11/06/2021 22:52:38 - INFO - __main__ - Step 11773: {'lr': 0.0004946408553585648, 'samples': 2260416, 'steps': 11772, 'loss/train': 1.1509099006652832} +11/06/2021 22:52:38 - INFO - __main__ - Step 11774: {'lr': 0.0004946397624022843, 'samples': 2260608, 'steps': 11773, 'loss/train': 2.2780723571777344} +11/06/2021 22:52:39 - INFO - __main__ - Step 11775: {'lr': 0.0004946386693357728, 'samples': 2260800, 'steps': 11774, 'loss/train': 1.5526584386825562} +11/06/2021 22:52:39 - INFO - __main__ - Step 11776: {'lr': 0.0004946375761590309, 'samples': 2260992, 'steps': 11775, 'loss/train': 2.048732280731201} +11/06/2021 22:52:39 - INFO - __main__ - Step 11777: {'lr': 0.0004946364828720592, 'samples': 2261184, 'steps': 11776, 'loss/train': 1.518662929534912} +11/06/2021 22:52:40 - INFO - __main__ - Step 11778: {'lr': 0.000494635389474858, 'samples': 2261376, 'steps': 11777, 'loss/train': 2.078202962875366} +11/06/2021 22:52:41 - INFO - __main__ - Step 11779: {'lr': 0.0004946342959674278, 'samples': 2261568, 'steps': 11778, 'loss/train': 1.6700574159622192} +11/06/2021 22:52:41 - INFO - __main__ - Step 11780: {'lr': 0.0004946332023497693, 'samples': 2261760, 'steps': 11779, 'loss/train': 2.0931074619293213} +11/06/2021 22:52:42 - INFO - __main__ - Step 11781: {'lr': 0.0004946321086218828, 'samples': 2261952, 'steps': 11780, 'loss/train': 1.8575305938720703} +11/06/2021 22:52:42 - INFO - __main__ - Step 11782: {'lr': 0.0004946310147837689, 'samples': 2262144, 'steps': 11781, 'loss/train': 1.1181639432907104} +11/06/2021 22:52:42 - INFO - __main__ - Step 11783: {'lr': 0.0004946299208354279, 'samples': 2262336, 'steps': 11782, 'loss/train': 1.7613064050674438} +11/06/2021 22:52:43 - INFO - __main__ - Step 11784: {'lr': 0.0004946288267768605, 'samples': 2262528, 'steps': 11783, 'loss/train': 1.5127317905426025} +11/06/2021 22:52:44 - INFO - __main__ - Step 11785: {'lr': 0.0004946277326080672, 'samples': 2262720, 'steps': 11784, 'loss/train': 1.9431092739105225} +11/06/2021 22:52:44 - INFO - __main__ - Step 11786: {'lr': 0.0004946266383290483, 'samples': 2262912, 'steps': 11785, 'loss/train': 2.022489547729492} +11/06/2021 22:52:44 - INFO - __main__ - Step 11787: {'lr': 0.0004946255439398045, 'samples': 2263104, 'steps': 11786, 'loss/train': 1.829660177230835} +11/06/2021 22:52:45 - INFO - __main__ - Step 11788: {'lr': 0.0004946244494403361, 'samples': 2263296, 'steps': 11787, 'loss/train': 1.7674616575241089} +11/06/2021 22:52:45 - INFO - __main__ - Step 11789: {'lr': 0.0004946233548306438, 'samples': 2263488, 'steps': 11788, 'loss/train': 1.8133692741394043} +11/06/2021 22:52:46 - INFO - __main__ - Step 11790: {'lr': 0.000494622260110728, 'samples': 2263680, 'steps': 11789, 'loss/train': 1.611851453781128} +11/06/2021 22:52:46 - INFO - __main__ - Step 11791: {'lr': 0.0004946211652805891, 'samples': 2263872, 'steps': 11790, 'loss/train': 1.1969035863876343} +11/06/2021 22:52:47 - INFO - __main__ - Step 11792: {'lr': 0.0004946200703402278, 'samples': 2264064, 'steps': 11791, 'loss/train': 2.1586251258850098} +11/06/2021 22:52:47 - INFO - __main__ - Step 11793: {'lr': 0.0004946189752896443, 'samples': 2264256, 'steps': 11792, 'loss/train': 1.361173152923584} +11/06/2021 22:52:47 - INFO - __main__ - Step 11794: {'lr': 0.0004946178801288394, 'samples': 2264448, 'steps': 11793, 'loss/train': 1.3458670377731323} +11/06/2021 22:52:48 - INFO - __main__ - Step 11795: {'lr': 0.0004946167848578134, 'samples': 2264640, 'steps': 11794, 'loss/train': 1.4906079769134521} +11/06/2021 22:52:49 - INFO - __main__ - Step 11796: {'lr': 0.0004946156894765669, 'samples': 2264832, 'steps': 11795, 'loss/train': 1.776194453239441} +11/06/2021 22:52:49 - INFO - __main__ - Step 11797: {'lr': 0.0004946145939851004, 'samples': 2265024, 'steps': 11796, 'loss/train': 1.1889792680740356} +11/06/2021 22:52:49 - INFO - __main__ - Step 11798: {'lr': 0.0004946134983834142, 'samples': 2265216, 'steps': 11797, 'loss/train': 1.3798962831497192} +11/06/2021 22:52:50 - INFO - __main__ - Step 11799: {'lr': 0.0004946124026715089, 'samples': 2265408, 'steps': 11798, 'loss/train': 1.1393816471099854} +11/06/2021 22:52:51 - INFO - __main__ - Step 11800: {'lr': 0.0004946113068493851, 'samples': 2265600, 'steps': 11799, 'loss/train': 1.938144326210022} +11/06/2021 22:52:51 - INFO - __main__ - Step 11801: {'lr': 0.0004946102109170433, 'samples': 2265792, 'steps': 11800, 'loss/train': 1.085551381111145} +11/06/2021 22:52:52 - INFO - __main__ - Step 11802: {'lr': 0.0004946091148744838, 'samples': 2265984, 'steps': 11801, 'loss/train': 1.9782894849777222} +11/06/2021 22:52:52 - INFO - __main__ - Step 11803: {'lr': 0.0004946080187217072, 'samples': 2266176, 'steps': 11802, 'loss/train': 1.8065892457962036} +11/06/2021 22:52:52 - INFO - __main__ - Step 11804: {'lr': 0.0004946069224587141, 'samples': 2266368, 'steps': 11803, 'loss/train': 1.8885177373886108} +11/06/2021 22:52:53 - INFO - __main__ - Step 11805: {'lr': 0.0004946058260855049, 'samples': 2266560, 'steps': 11804, 'loss/train': 1.6581742763519287} +11/06/2021 22:52:54 - INFO - __main__ - Step 11806: {'lr': 0.00049460472960208, 'samples': 2266752, 'steps': 11805, 'loss/train': 1.8669217824935913} +11/06/2021 22:52:54 - INFO - __main__ - Step 11807: {'lr': 0.00049460363300844, 'samples': 2266944, 'steps': 11806, 'loss/train': 1.47137451171875} +11/06/2021 22:52:54 - INFO - __main__ - Step 11808: {'lr': 0.0004946025363045854, 'samples': 2267136, 'steps': 11807, 'loss/train': 1.8952033519744873} +11/06/2021 22:52:55 - INFO - __main__ - Step 11809: {'lr': 0.0004946014394905167, 'samples': 2267328, 'steps': 11808, 'loss/train': 1.2856425046920776} +11/06/2021 22:52:56 - INFO - __main__ - Step 11810: {'lr': 0.0004946003425662343, 'samples': 2267520, 'steps': 11809, 'loss/train': 2.00896954536438} +11/06/2021 22:52:56 - INFO - __main__ - Step 11811: {'lr': 0.0004945992455317389, 'samples': 2267712, 'steps': 11810, 'loss/train': 1.724480390548706} +11/06/2021 22:52:56 - INFO - __main__ - Step 11812: {'lr': 0.0004945981483870307, 'samples': 2267904, 'steps': 11811, 'loss/train': 1.5671536922454834} +11/06/2021 22:52:57 - INFO - __main__ - Step 11813: {'lr': 0.0004945970511321104, 'samples': 2268096, 'steps': 11812, 'loss/train': 2.0063626766204834} +11/06/2021 22:52:57 - INFO - __main__ - Step 11814: {'lr': 0.0004945959537669784, 'samples': 2268288, 'steps': 11813, 'loss/train': 1.2561020851135254} +11/06/2021 22:52:57 - INFO - __main__ - Step 11815: {'lr': 0.0004945948562916353, 'samples': 2268480, 'steps': 11814, 'loss/train': 1.8354805707931519} +11/06/2021 22:52:59 - INFO - __main__ - Step 11816: {'lr': 0.0004945937587060815, 'samples': 2268672, 'steps': 11815, 'loss/train': 1.270841360092163} +11/06/2021 22:53:00 - INFO - __main__ - Step 11817: {'lr': 0.0004945926610103175, 'samples': 2268864, 'steps': 11816, 'loss/train': 1.2347999811172485} +11/06/2021 22:53:00 - INFO - __main__ - Step 11818: {'lr': 0.0004945915632043439, 'samples': 2269056, 'steps': 11817, 'loss/train': 1.340549349784851} +11/06/2021 22:53:00 - INFO - __main__ - Step 11819: {'lr': 0.0004945904652881611, 'samples': 2269248, 'steps': 11818, 'loss/train': 1.905003547668457} +11/06/2021 22:53:01 - INFO - __main__ - Step 11820: {'lr': 0.0004945893672617695, 'samples': 2269440, 'steps': 11819, 'loss/train': 1.818457841873169} +11/06/2021 22:53:01 - INFO - __main__ - Step 11821: {'lr': 0.0004945882691251699, 'samples': 2269632, 'steps': 11820, 'loss/train': 1.8213856220245361} +11/06/2021 22:53:02 - INFO - __main__ - Step 11822: {'lr': 0.0004945871708783625, 'samples': 2269824, 'steps': 11821, 'loss/train': 1.8481453657150269} +11/06/2021 22:53:02 - INFO - __main__ - Step 11823: {'lr': 0.0004945860725213477, 'samples': 2270016, 'steps': 11822, 'loss/train': 1.7589327096939087} +11/06/2021 22:53:03 - INFO - __main__ - Step 11824: {'lr': 0.0004945849740541265, 'samples': 2270208, 'steps': 11823, 'loss/train': 1.8017772436141968} +11/06/2021 22:53:03 - INFO - __main__ - Step 11825: {'lr': 0.000494583875476699, 'samples': 2270400, 'steps': 11824, 'loss/train': 1.8388363122940063} +11/06/2021 22:53:03 - INFO - __main__ - Step 11826: {'lr': 0.0004945827767890657, 'samples': 2270592, 'steps': 11825, 'loss/train': 1.1017407178878784} +11/06/2021 22:53:04 - INFO - __main__ - Step 11827: {'lr': 0.0004945816779912272, 'samples': 2270784, 'steps': 11826, 'loss/train': 1.1215801239013672} +11/06/2021 22:53:05 - INFO - __main__ - Step 11828: {'lr': 0.000494580579083184, 'samples': 2270976, 'steps': 11827, 'loss/train': 1.8502867221832275} +11/06/2021 22:53:05 - INFO - __main__ - Step 11829: {'lr': 0.0004945794800649366, 'samples': 2271168, 'steps': 11828, 'loss/train': 1.7619470357894897} +11/06/2021 22:53:06 - INFO - __main__ - Step 11830: {'lr': 0.0004945783809364853, 'samples': 2271360, 'steps': 11829, 'loss/train': 1.7739301919937134} +11/06/2021 22:53:06 - INFO - __main__ - Step 11831: {'lr': 0.0004945772816978309, 'samples': 2271552, 'steps': 11830, 'loss/train': 1.8250958919525146} +11/06/2021 22:53:06 - INFO - __main__ - Step 11832: {'lr': 0.0004945761823489737, 'samples': 2271744, 'steps': 11831, 'loss/train': 2.298485040664673} +11/06/2021 22:53:07 - INFO - __main__ - Step 11833: {'lr': 0.0004945750828899144, 'samples': 2271936, 'steps': 11832, 'loss/train': 1.6959924697875977} +11/06/2021 22:53:08 - INFO - __main__ - Step 11834: {'lr': 0.0004945739833206531, 'samples': 2272128, 'steps': 11833, 'loss/train': 1.4420230388641357} +11/06/2021 22:53:08 - INFO - __main__ - Step 11835: {'lr': 0.0004945728836411907, 'samples': 2272320, 'steps': 11834, 'loss/train': 1.9085041284561157} +11/06/2021 22:53:08 - INFO - __main__ - Step 11836: {'lr': 0.0004945717838515275, 'samples': 2272512, 'steps': 11835, 'loss/train': 1.7910774946212769} +11/06/2021 22:53:09 - INFO - __main__ - Step 11837: {'lr': 0.0004945706839516639, 'samples': 2272704, 'steps': 11836, 'loss/train': 0.9751549363136292} +11/06/2021 22:53:10 - INFO - __main__ - Step 11838: {'lr': 0.0004945695839416006, 'samples': 2272896, 'steps': 11837, 'loss/train': 1.1652768850326538} +11/06/2021 22:53:10 - INFO - __main__ - Step 11839: {'lr': 0.0004945684838213382, 'samples': 2273088, 'steps': 11838, 'loss/train': 2.4562861919403076} +11/06/2021 22:53:10 - INFO - __main__ - Step 11840: {'lr': 0.0004945673835908767, 'samples': 2273280, 'steps': 11839, 'loss/train': 1.785056233406067} +11/06/2021 22:53:11 - INFO - __main__ - Step 11841: {'lr': 0.0004945662832502171, 'samples': 2273472, 'steps': 11840, 'loss/train': 1.478073000907898} +11/06/2021 22:53:11 - INFO - __main__ - Step 11842: {'lr': 0.0004945651827993597, 'samples': 2273664, 'steps': 11841, 'loss/train': 1.5558642148971558} +11/06/2021 22:53:11 - INFO - __main__ - Step 11843: {'lr': 0.000494564082238305, 'samples': 2273856, 'steps': 11842, 'loss/train': 1.5626791715621948} +11/06/2021 22:53:13 - INFO - __main__ - Step 11844: {'lr': 0.0004945629815670535, 'samples': 2274048, 'steps': 11843, 'loss/train': 1.923411250114441} +11/06/2021 22:53:13 - INFO - __main__ - Step 11845: {'lr': 0.0004945618807856056, 'samples': 2274240, 'steps': 11844, 'loss/train': 1.2191367149353027} +11/06/2021 22:53:13 - INFO - __main__ - Step 11846: {'lr': 0.000494560779893962, 'samples': 2274432, 'steps': 11845, 'loss/train': 1.695072054862976} +11/06/2021 22:53:14 - INFO - __main__ - Step 11847: {'lr': 0.0004945596788921231, 'samples': 2274624, 'steps': 11846, 'loss/train': 1.8576159477233887} +11/06/2021 22:53:14 - INFO - __main__ - Step 11848: {'lr': 0.0004945585777800893, 'samples': 2274816, 'steps': 11847, 'loss/train': 1.8127880096435547} +11/06/2021 22:53:15 - INFO - __main__ - Step 11849: {'lr': 0.0004945574765578612, 'samples': 2275008, 'steps': 11848, 'loss/train': 1.4972808361053467} +11/06/2021 22:53:15 - INFO - __main__ - Step 11850: {'lr': 0.0004945563752254393, 'samples': 2275200, 'steps': 11849, 'loss/train': 1.7864632606506348} +11/06/2021 22:53:16 - INFO - __main__ - Step 11851: {'lr': 0.000494555273782824, 'samples': 2275392, 'steps': 11850, 'loss/train': 1.0610276460647583} +11/06/2021 22:53:16 - INFO - __main__ - Step 11852: {'lr': 0.000494554172230016, 'samples': 2275584, 'steps': 11851, 'loss/train': 1.3797191381454468} +11/06/2021 22:53:16 - INFO - __main__ - Step 11853: {'lr': 0.0004945530705670156, 'samples': 2275776, 'steps': 11852, 'loss/train': 1.7779545783996582} +11/06/2021 22:53:18 - INFO - __main__ - Step 11854: {'lr': 0.0004945519687938234, 'samples': 2275968, 'steps': 11853, 'loss/train': 1.6782175302505493} +11/06/2021 22:53:18 - INFO - __main__ - Step 11855: {'lr': 0.0004945508669104397, 'samples': 2276160, 'steps': 11854, 'loss/train': 2.7653017044067383} +11/06/2021 22:53:18 - INFO - __main__ - Step 11856: {'lr': 0.0004945497649168654, 'samples': 2276352, 'steps': 11855, 'loss/train': 1.727919340133667} +11/06/2021 22:53:19 - INFO - __main__ - Step 11857: {'lr': 0.0004945486628131006, 'samples': 2276544, 'steps': 11856, 'loss/train': 1.342666506767273} +11/06/2021 22:53:19 - INFO - __main__ - Step 11858: {'lr': 0.0004945475605991459, 'samples': 2276736, 'steps': 11857, 'loss/train': 0.3159283399581909} +11/06/2021 22:53:20 - INFO - __main__ - Step 11859: {'lr': 0.0004945464582750019, 'samples': 2276928, 'steps': 11858, 'loss/train': 1.7237508296966553} +11/06/2021 22:53:20 - INFO - __main__ - Step 11860: {'lr': 0.000494545355840669, 'samples': 2277120, 'steps': 11859, 'loss/train': 1.4004329442977905} +11/06/2021 22:53:21 - INFO - __main__ - Step 11861: {'lr': 0.0004945442532961478, 'samples': 2277312, 'steps': 11860, 'loss/train': 1.3610728979110718} +11/06/2021 22:53:21 - INFO - __main__ - Step 11862: {'lr': 0.0004945431506414386, 'samples': 2277504, 'steps': 11861, 'loss/train': 2.1039764881134033} +11/06/2021 22:53:21 - INFO - __main__ - Step 11863: {'lr': 0.0004945420478765422, 'samples': 2277696, 'steps': 11862, 'loss/train': 2.395843505859375} +11/06/2021 22:53:22 - INFO - __main__ - Step 11864: {'lr': 0.0004945409450014588, 'samples': 2277888, 'steps': 11863, 'loss/train': 1.4284261465072632} +11/06/2021 22:53:23 - INFO - __main__ - Step 11865: {'lr': 0.0004945398420161892, 'samples': 2278080, 'steps': 11864, 'loss/train': 1.9594630002975464} +11/06/2021 22:53:23 - INFO - __main__ - Step 11866: {'lr': 0.0004945387389207335, 'samples': 2278272, 'steps': 11865, 'loss/train': 1.446509599685669} +11/06/2021 22:53:23 - INFO - __main__ - Step 11867: {'lr': 0.0004945376357150926, 'samples': 2278464, 'steps': 11866, 'loss/train': 1.6203410625457764} +11/06/2021 22:53:24 - INFO - __main__ - Step 11868: {'lr': 0.0004945365323992668, 'samples': 2278656, 'steps': 11867, 'loss/train': 1.354360818862915} +11/06/2021 22:53:24 - INFO - __main__ - Step 11869: {'lr': 0.0004945354289732565, 'samples': 2278848, 'steps': 11868, 'loss/train': 1.6801567077636719} +11/06/2021 22:53:25 - INFO - __main__ - Step 11870: {'lr': 0.0004945343254370623, 'samples': 2279040, 'steps': 11869, 'loss/train': 1.8512502908706665} +11/06/2021 22:53:26 - INFO - __main__ - Step 11871: {'lr': 0.0004945332217906848, 'samples': 2279232, 'steps': 11870, 'loss/train': 1.6721792221069336} +11/06/2021 22:53:26 - INFO - __main__ - Step 11872: {'lr': 0.0004945321180341244, 'samples': 2279424, 'steps': 11871, 'loss/train': 1.7960259914398193} +11/06/2021 22:53:26 - INFO - __main__ - Step 11873: {'lr': 0.0004945310141673816, 'samples': 2279616, 'steps': 11872, 'loss/train': 1.7067826986312866} +11/06/2021 22:53:27 - INFO - __main__ - Step 11874: {'lr': 0.0004945299101904568, 'samples': 2279808, 'steps': 11873, 'loss/train': 1.8478683233261108} +11/06/2021 22:53:28 - INFO - __main__ - Step 11875: {'lr': 0.0004945288061033507, 'samples': 2280000, 'steps': 11874, 'loss/train': 1.8449006080627441} +11/06/2021 22:53:28 - INFO - __main__ - Step 11876: {'lr': 0.0004945277019060637, 'samples': 2280192, 'steps': 11875, 'loss/train': 1.7363343238830566} +11/06/2021 22:53:28 - INFO - __main__ - Step 11877: {'lr': 0.0004945265975985962, 'samples': 2280384, 'steps': 11876, 'loss/train': 1.287642478942871} +11/06/2021 22:53:29 - INFO - __main__ - Step 11878: {'lr': 0.0004945254931809489, 'samples': 2280576, 'steps': 11877, 'loss/train': 1.5857558250427246} +11/06/2021 22:53:29 - INFO - __main__ - Step 11879: {'lr': 0.000494524388653122, 'samples': 2280768, 'steps': 11878, 'loss/train': 1.3704111576080322} +11/06/2021 22:53:30 - INFO - __main__ - Step 11880: {'lr': 0.0004945232840151164, 'samples': 2280960, 'steps': 11879, 'loss/train': 1.9039316177368164} +11/06/2021 22:53:31 - INFO - __main__ - Step 11881: {'lr': 0.0004945221792669322, 'samples': 2281152, 'steps': 11880, 'loss/train': 1.6828198432922363} +11/06/2021 22:53:31 - INFO - __main__ - Step 11882: {'lr': 0.0004945210744085702, 'samples': 2281344, 'steps': 11881, 'loss/train': 2.2412431240081787} +11/06/2021 22:53:31 - INFO - __main__ - Step 11883: {'lr': 0.0004945199694400308, 'samples': 2281536, 'steps': 11882, 'loss/train': 1.4356671571731567} +11/06/2021 22:53:32 - INFO - __main__ - Step 11884: {'lr': 0.0004945188643613144, 'samples': 2281728, 'steps': 11883, 'loss/train': 1.609714388847351} +11/06/2021 22:53:33 - INFO - __main__ - Step 11885: {'lr': 0.0004945177591724216, 'samples': 2281920, 'steps': 11884, 'loss/train': 1.3597244024276733} +11/06/2021 22:53:33 - INFO - __main__ - Step 11886: {'lr': 0.0004945166538733529, 'samples': 2282112, 'steps': 11885, 'loss/train': 1.8882817029953003} +11/06/2021 22:53:33 - INFO - __main__ - Step 11887: {'lr': 0.0004945155484641087, 'samples': 2282304, 'steps': 11886, 'loss/train': 1.242563009262085} +11/06/2021 22:53:34 - INFO - __main__ - Step 11888: {'lr': 0.0004945144429446897, 'samples': 2282496, 'steps': 11887, 'loss/train': 1.8521512746810913} +11/06/2021 22:53:34 - INFO - __main__ - Step 11889: {'lr': 0.000494513337315096, 'samples': 2282688, 'steps': 11888, 'loss/train': 1.7061456441879272} +11/06/2021 22:53:35 - INFO - __main__ - Step 11890: {'lr': 0.0004945122315753286, 'samples': 2282880, 'steps': 11889, 'loss/train': 1.742601990699768} +11/06/2021 22:53:35 - INFO - __main__ - Step 11891: {'lr': 0.0004945111257253877, 'samples': 2283072, 'steps': 11890, 'loss/train': 1.7886587381362915} +11/06/2021 22:53:36 - INFO - __main__ - Step 11892: {'lr': 0.0004945100197652738, 'samples': 2283264, 'steps': 11891, 'loss/train': 2.3092379570007324} +11/06/2021 22:53:36 - INFO - __main__ - Step 11893: {'lr': 0.0004945089136949876, 'samples': 2283456, 'steps': 11892, 'loss/train': 1.7748466730117798} +11/06/2021 22:53:37 - INFO - __main__ - Step 11894: {'lr': 0.0004945078075145292, 'samples': 2283648, 'steps': 11893, 'loss/train': 2.0001227855682373} +11/06/2021 22:53:37 - INFO - __main__ - Step 11895: {'lr': 0.0004945067012238996, 'samples': 2283840, 'steps': 11894, 'loss/train': 1.475651502609253} +11/06/2021 22:53:38 - INFO - __main__ - Step 11896: {'lr': 0.000494505594823099, 'samples': 2284032, 'steps': 11895, 'loss/train': 0.5591633915901184} +11/06/2021 22:53:38 - INFO - __main__ - Step 11897: {'lr': 0.0004945044883121279, 'samples': 2284224, 'steps': 11896, 'loss/train': 1.6657626628875732} +11/06/2021 22:53:39 - INFO - __main__ - Step 11898: {'lr': 0.0004945033816909868, 'samples': 2284416, 'steps': 11897, 'loss/train': 1.5739197731018066} +11/06/2021 22:53:39 - INFO - __main__ - Step 11899: {'lr': 0.0004945022749596764, 'samples': 2284608, 'steps': 11898, 'loss/train': 1.6990892887115479} +11/06/2021 22:53:39 - INFO - __main__ - Step 11900: {'lr': 0.000494501168118197, 'samples': 2284800, 'steps': 11899, 'loss/train': 1.785287618637085} +11/06/2021 22:53:40 - INFO - __main__ - Step 11901: {'lr': 0.0004945000611665491, 'samples': 2284992, 'steps': 11900, 'loss/train': 1.6788626909255981} +11/06/2021 22:53:41 - INFO - __main__ - Step 11902: {'lr': 0.0004944989541047333, 'samples': 2285184, 'steps': 11901, 'loss/train': 1.9078575372695923} +11/06/2021 22:53:41 - INFO - __main__ - Step 11903: {'lr': 0.0004944978469327499, 'samples': 2285376, 'steps': 11902, 'loss/train': 1.8978601694107056} +11/06/2021 22:53:41 - INFO - __main__ - Step 11904: {'lr': 0.0004944967396505998, 'samples': 2285568, 'steps': 11903, 'loss/train': 1.5183367729187012} +11/06/2021 22:53:42 - INFO - __main__ - Step 11905: {'lr': 0.000494495632258283, 'samples': 2285760, 'steps': 11904, 'loss/train': 1.6283320188522339} +11/06/2021 22:53:43 - INFO - __main__ - Step 11906: {'lr': 0.0004944945247558004, 'samples': 2285952, 'steps': 11905, 'loss/train': 1.0076183080673218} +11/06/2021 22:53:43 - INFO - __main__ - Step 11907: {'lr': 0.0004944934171431522, 'samples': 2286144, 'steps': 11906, 'loss/train': 1.794429898262024} +11/06/2021 22:53:43 - INFO - __main__ - Step 11908: {'lr': 0.0004944923094203391, 'samples': 2286336, 'steps': 11907, 'loss/train': 1.9065196514129639} +11/06/2021 22:53:44 - INFO - __main__ - Step 11909: {'lr': 0.0004944912015873616, 'samples': 2286528, 'steps': 11908, 'loss/train': 1.092329740524292} +11/06/2021 22:53:44 - INFO - __main__ - Step 11910: {'lr': 0.0004944900936442201, 'samples': 2286720, 'steps': 11909, 'loss/train': 1.7471907138824463} +11/06/2021 22:53:45 - INFO - __main__ - Step 11911: {'lr': 0.000494488985590915, 'samples': 2286912, 'steps': 11910, 'loss/train': 2.4433507919311523} +11/06/2021 22:53:46 - INFO - __main__ - Step 11912: {'lr': 0.0004944878774274472, 'samples': 2287104, 'steps': 11911, 'loss/train': 1.9557836055755615} +11/06/2021 22:53:46 - INFO - __main__ - Step 11913: {'lr': 0.0004944867691538167, 'samples': 2287296, 'steps': 11912, 'loss/train': 1.8252263069152832} +11/06/2021 22:53:46 - INFO - __main__ - Step 11914: {'lr': 0.0004944856607700243, 'samples': 2287488, 'steps': 11913, 'loss/train': 1.3514317274093628} +11/06/2021 22:53:47 - INFO - __main__ - Step 11915: {'lr': 0.0004944845522760706, 'samples': 2287680, 'steps': 11914, 'loss/train': 1.4288444519042969} +11/06/2021 22:53:47 - INFO - __main__ - Step 11916: {'lr': 0.0004944834436719557, 'samples': 2287872, 'steps': 11915, 'loss/train': 1.7817126512527466} +11/06/2021 22:53:48 - INFO - __main__ - Step 11917: {'lr': 0.0004944823349576805, 'samples': 2288064, 'steps': 11916, 'loss/train': 0.9959566593170166} +11/06/2021 22:53:48 - INFO - __main__ - Step 11918: {'lr': 0.0004944812261332452, 'samples': 2288256, 'steps': 11917, 'loss/train': 1.2782503366470337} +11/06/2021 22:53:49 - INFO - __main__ - Step 11919: {'lr': 0.0004944801171986505, 'samples': 2288448, 'steps': 11918, 'loss/train': 1.4812965393066406} +11/06/2021 22:53:49 - INFO - __main__ - Step 11920: {'lr': 0.0004944790081538969, 'samples': 2288640, 'steps': 11919, 'loss/train': 1.7780016660690308} +11/06/2021 22:53:49 - INFO - __main__ - Step 11921: {'lr': 0.0004944778989989847, 'samples': 2288832, 'steps': 11920, 'loss/train': 2.459728240966797} +11/06/2021 22:53:50 - INFO - __main__ - Step 11922: {'lr': 0.0004944767897339146, 'samples': 2289024, 'steps': 11921, 'loss/train': 1.5695812702178955} +11/06/2021 22:53:51 - INFO - __main__ - Step 11923: {'lr': 0.000494475680358687, 'samples': 2289216, 'steps': 11922, 'loss/train': 1.9413129091262817} +11/06/2021 22:53:51 - INFO - __main__ - Step 11924: {'lr': 0.0004944745708733025, 'samples': 2289408, 'steps': 11923, 'loss/train': 2.0285587310791016} +11/06/2021 22:53:52 - INFO - __main__ - Step 11925: {'lr': 0.0004944734612777615, 'samples': 2289600, 'steps': 11924, 'loss/train': 1.9409503936767578} +11/06/2021 22:53:52 - INFO - __main__ - Step 11926: {'lr': 0.0004944723515720645, 'samples': 2289792, 'steps': 11925, 'loss/train': 1.747592806816101} +11/06/2021 22:53:53 - INFO - __main__ - Step 11927: {'lr': 0.000494471241756212, 'samples': 2289984, 'steps': 11926, 'loss/train': 1.674291729927063} +11/06/2021 22:53:53 - INFO - __main__ - Step 11928: {'lr': 0.0004944701318302046, 'samples': 2290176, 'steps': 11927, 'loss/train': 1.5972325801849365} +11/06/2021 22:53:54 - INFO - __main__ - Step 11929: {'lr': 0.0004944690217940427, 'samples': 2290368, 'steps': 11928, 'loss/train': 1.5960736274719238} +11/06/2021 22:53:54 - INFO - __main__ - Step 11930: {'lr': 0.0004944679116477269, 'samples': 2290560, 'steps': 11929, 'loss/train': 1.5236477851867676} +11/06/2021 22:53:54 - INFO - __main__ - Step 11931: {'lr': 0.0004944668013912575, 'samples': 2290752, 'steps': 11930, 'loss/train': 1.5838426351547241} +11/06/2021 22:53:55 - INFO - __main__ - Step 11932: {'lr': 0.0004944656910246352, 'samples': 2290944, 'steps': 11931, 'loss/train': 1.651598572731018} +11/06/2021 22:53:56 - INFO - __main__ - Step 11933: {'lr': 0.0004944645805478605, 'samples': 2291136, 'steps': 11932, 'loss/train': 1.3770673274993896} +11/06/2021 22:53:56 - INFO - __main__ - Step 11934: {'lr': 0.0004944634699609338, 'samples': 2291328, 'steps': 11933, 'loss/train': 2.044022560119629} +11/06/2021 22:53:56 - INFO - __main__ - Step 11935: {'lr': 0.0004944623592638555, 'samples': 2291520, 'steps': 11934, 'loss/train': 1.4433174133300781} +11/06/2021 22:53:57 - INFO - __main__ - Step 11936: {'lr': 0.0004944612484566263, 'samples': 2291712, 'steps': 11935, 'loss/train': 1.43559730052948} +11/06/2021 22:53:57 - INFO - __main__ - Step 11937: {'lr': 0.0004944601375392467, 'samples': 2291904, 'steps': 11936, 'loss/train': 2.0127391815185547} +11/06/2021 22:53:58 - INFO - __main__ - Step 11938: {'lr': 0.000494459026511717, 'samples': 2292096, 'steps': 11937, 'loss/train': 1.7522636651992798} +11/06/2021 22:53:59 - INFO - __main__ - Step 11939: {'lr': 0.000494457915374038, 'samples': 2292288, 'steps': 11938, 'loss/train': 1.910089373588562} +11/06/2021 22:53:59 - INFO - __main__ - Step 11940: {'lr': 0.00049445680412621, 'samples': 2292480, 'steps': 11939, 'loss/train': 1.6067532300949097} +11/06/2021 22:53:59 - INFO - __main__ - Step 11941: {'lr': 0.0004944556927682335, 'samples': 2292672, 'steps': 11940, 'loss/train': 1.7804417610168457} +11/06/2021 22:54:00 - INFO - __main__ - Step 11942: {'lr': 0.000494454581300109, 'samples': 2292864, 'steps': 11941, 'loss/train': 1.387055516242981} +11/06/2021 22:54:00 - INFO - __main__ - Step 11943: {'lr': 0.0004944534697218371, 'samples': 2293056, 'steps': 11942, 'loss/train': 1.4685114622116089} +11/06/2021 22:54:01 - INFO - __main__ - Step 11944: {'lr': 0.0004944523580334183, 'samples': 2293248, 'steps': 11943, 'loss/train': 0.5896292924880981} +11/06/2021 22:54:01 - INFO - __main__ - Step 11945: {'lr': 0.0004944512462348528, 'samples': 2293440, 'steps': 11944, 'loss/train': 1.9006822109222412} +11/06/2021 22:54:02 - INFO - __main__ - Step 11946: {'lr': 0.0004944501343261416, 'samples': 2293632, 'steps': 11945, 'loss/train': 1.7416223287582397} +11/06/2021 22:54:02 - INFO - __main__ - Step 11947: {'lr': 0.0004944490223072848, 'samples': 2293824, 'steps': 11946, 'loss/train': 0.48262572288513184} +11/06/2021 22:54:03 - INFO - __main__ - Step 11948: {'lr': 0.0004944479101782831, 'samples': 2294016, 'steps': 11947, 'loss/train': 1.9362751245498657} +11/06/2021 22:54:03 - INFO - __main__ - Step 11949: {'lr': 0.0004944467979391369, 'samples': 2294208, 'steps': 11948, 'loss/train': 1.4246046543121338} +11/06/2021 22:54:04 - INFO - __main__ - Step 11950: {'lr': 0.0004944456855898469, 'samples': 2294400, 'steps': 11949, 'loss/train': 1.5375300645828247} +11/06/2021 22:54:04 - INFO - __main__ - Step 11951: {'lr': 0.0004944445731304133, 'samples': 2294592, 'steps': 11950, 'loss/train': 2.0238983631134033} +11/06/2021 22:54:04 - INFO - __main__ - Step 11952: {'lr': 0.0004944434605608367, 'samples': 2294784, 'steps': 11951, 'loss/train': 1.2838270664215088} +11/06/2021 22:54:05 - INFO - __main__ - Step 11953: {'lr': 0.0004944423478811177, 'samples': 2294976, 'steps': 11952, 'loss/train': 1.7840559482574463} +11/06/2021 22:54:06 - INFO - __main__ - Step 11954: {'lr': 0.0004944412350912567, 'samples': 2295168, 'steps': 11953, 'loss/train': 1.7490830421447754} +11/06/2021 22:54:06 - INFO - __main__ - Step 11955: {'lr': 0.0004944401221912544, 'samples': 2295360, 'steps': 11954, 'loss/train': 1.8949376344680786} +11/06/2021 22:54:06 - INFO - __main__ - Step 11956: {'lr': 0.0004944390091811111, 'samples': 2295552, 'steps': 11955, 'loss/train': 1.7346197366714478} +11/06/2021 22:54:07 - INFO - __main__ - Step 11957: {'lr': 0.0004944378960608272, 'samples': 2295744, 'steps': 11956, 'loss/train': 1.9037965536117554} +11/06/2021 22:54:07 - INFO - __main__ - Step 11958: {'lr': 0.0004944367828304035, 'samples': 2295936, 'steps': 11957, 'loss/train': 1.8399511575698853} +11/06/2021 22:54:08 - INFO - __main__ - Step 11959: {'lr': 0.0004944356694898404, 'samples': 2296128, 'steps': 11958, 'loss/train': 0.14074699580669403} +11/06/2021 22:54:09 - INFO - __main__ - Step 11960: {'lr': 0.0004944345560391382, 'samples': 2296320, 'steps': 11959, 'loss/train': 1.9995806217193604} +11/06/2021 22:54:09 - INFO - __main__ - Step 11961: {'lr': 0.0004944334424782977, 'samples': 2296512, 'steps': 11960, 'loss/train': 1.5391980409622192} +11/06/2021 22:54:09 - INFO - __main__ - Step 11962: {'lr': 0.0004944323288073192, 'samples': 2296704, 'steps': 11961, 'loss/train': 1.4151784181594849} +11/06/2021 22:54:10 - INFO - __main__ - Step 11963: {'lr': 0.0004944312150262033, 'samples': 2296896, 'steps': 11962, 'loss/train': 1.0756903886795044} +11/06/2021 22:54:11 - INFO - __main__ - Step 11964: {'lr': 0.0004944301011349505, 'samples': 2297088, 'steps': 11963, 'loss/train': 1.644909143447876} +11/06/2021 22:54:11 - INFO - __main__ - Step 11965: {'lr': 0.0004944289871335612, 'samples': 2297280, 'steps': 11964, 'loss/train': 2.0946547985076904} +11/06/2021 22:54:11 - INFO - __main__ - Step 11966: {'lr': 0.0004944278730220359, 'samples': 2297472, 'steps': 11965, 'loss/train': 1.4997888803482056} +11/06/2021 22:54:12 - INFO - __main__ - Step 11967: {'lr': 0.0004944267588003754, 'samples': 2297664, 'steps': 11966, 'loss/train': 1.587903618812561} +11/06/2021 22:54:12 - INFO - __main__ - Step 11968: {'lr': 0.0004944256444685798, 'samples': 2297856, 'steps': 11967, 'loss/train': 1.6351916790008545} +11/06/2021 22:54:13 - INFO - __main__ - Step 11969: {'lr': 0.0004944245300266498, 'samples': 2298048, 'steps': 11968, 'loss/train': 1.4442037343978882} +11/06/2021 22:54:13 - INFO - __main__ - Step 11970: {'lr': 0.0004944234154745859, 'samples': 2298240, 'steps': 11969, 'loss/train': 1.8854682445526123} +11/06/2021 22:54:14 - INFO - __main__ - Step 11971: {'lr': 0.0004944223008123886, 'samples': 2298432, 'steps': 11970, 'loss/train': 1.832446813583374} +11/06/2021 22:54:14 - INFO - __main__ - Step 11972: {'lr': 0.0004944211860400582, 'samples': 2298624, 'steps': 11971, 'loss/train': 1.448323130607605} +11/06/2021 22:54:15 - INFO - __main__ - Step 11973: {'lr': 0.0004944200711575956, 'samples': 2298816, 'steps': 11972, 'loss/train': 1.9672355651855469} +11/06/2021 22:54:16 - INFO - __main__ - Step 11974: {'lr': 0.0004944189561650011, 'samples': 2299008, 'steps': 11973, 'loss/train': 1.4000511169433594} +11/06/2021 22:54:16 - INFO - __main__ - Step 11975: {'lr': 0.0004944178410622751, 'samples': 2299200, 'steps': 11974, 'loss/train': 1.234156847000122} +11/06/2021 22:54:17 - INFO - __main__ - Step 11976: {'lr': 0.0004944167258494181, 'samples': 2299392, 'steps': 11975, 'loss/train': 1.449386477470398} +11/06/2021 22:54:17 - INFO - __main__ - Step 11977: {'lr': 0.0004944156105264308, 'samples': 2299584, 'steps': 11976, 'loss/train': 0.3471572995185852} +11/06/2021 22:54:17 - INFO - __main__ - Step 11978: {'lr': 0.0004944144950933137, 'samples': 2299776, 'steps': 11977, 'loss/train': 1.291796088218689} +11/06/2021 22:54:18 - INFO - __main__ - Step 11979: {'lr': 0.000494413379550067, 'samples': 2299968, 'steps': 11978, 'loss/train': 1.4064840078353882} +11/06/2021 22:54:19 - INFO - __main__ - Step 11980: {'lr': 0.0004944122638966916, 'samples': 2300160, 'steps': 11979, 'loss/train': 2.1589348316192627} +11/06/2021 22:54:19 - INFO - __main__ - Step 11981: {'lr': 0.0004944111481331876, 'samples': 2300352, 'steps': 11980, 'loss/train': 2.178071975708008} +11/06/2021 22:54:19 - INFO - __main__ - Step 11982: {'lr': 0.0004944100322595558, 'samples': 2300544, 'steps': 11981, 'loss/train': 1.5777186155319214} +11/06/2021 22:54:20 - INFO - __main__ - Step 11983: {'lr': 0.0004944089162757968, 'samples': 2300736, 'steps': 11982, 'loss/train': 1.8397846221923828} +11/06/2021 22:54:21 - INFO - __main__ - Step 11984: {'lr': 0.0004944078001819106, 'samples': 2300928, 'steps': 11983, 'loss/train': 1.9047267436981201} +11/06/2021 22:54:21 - INFO - __main__ - Step 11985: {'lr': 0.0004944066839778983, 'samples': 2301120, 'steps': 11984, 'loss/train': 1.7153035402297974} +11/06/2021 22:54:21 - INFO - __main__ - Step 11986: {'lr': 0.0004944055676637599, 'samples': 2301312, 'steps': 11985, 'loss/train': 1.4917117357254028} +11/06/2021 22:54:22 - INFO - __main__ - Step 11987: {'lr': 0.0004944044512394962, 'samples': 2301504, 'steps': 11986, 'loss/train': 1.906925916671753} +11/06/2021 22:54:22 - INFO - __main__ - Step 11988: {'lr': 0.0004944033347051076, 'samples': 2301696, 'steps': 11987, 'loss/train': 1.9712414741516113} +11/06/2021 22:54:23 - INFO - __main__ - Step 11989: {'lr': 0.0004944022180605947, 'samples': 2301888, 'steps': 11988, 'loss/train': 1.898970127105713} +11/06/2021 22:54:24 - INFO - __main__ - Step 11990: {'lr': 0.0004944011013059579, 'samples': 2302080, 'steps': 11989, 'loss/train': 1.1535645723342896} +11/06/2021 22:54:24 - INFO - __main__ - Step 11991: {'lr': 0.0004943999844411977, 'samples': 2302272, 'steps': 11990, 'loss/train': 1.2547049522399902} +11/06/2021 22:54:24 - INFO - __main__ - Step 11992: {'lr': 0.0004943988674663147, 'samples': 2302464, 'steps': 11991, 'loss/train': 1.8330069780349731} +11/06/2021 22:54:25 - INFO - __main__ - Step 11993: {'lr': 0.0004943977503813092, 'samples': 2302656, 'steps': 11992, 'loss/train': 1.3840059041976929} +11/06/2021 22:54:25 - INFO - __main__ - Step 11994: {'lr': 0.000494396633186182, 'samples': 2302848, 'steps': 11993, 'loss/train': 2.0180881023406982} +11/06/2021 22:54:26 - INFO - __main__ - Step 11995: {'lr': 0.0004943955158809334, 'samples': 2303040, 'steps': 11994, 'loss/train': 1.7665796279907227} +11/06/2021 22:54:26 - INFO - __main__ - Step 11996: {'lr': 0.0004943943984655639, 'samples': 2303232, 'steps': 11995, 'loss/train': 1.3726966381072998} +11/06/2021 22:54:27 - INFO - __main__ - Step 11997: {'lr': 0.0004943932809400741, 'samples': 2303424, 'steps': 11996, 'loss/train': 1.9251682758331299} +11/06/2021 22:54:27 - INFO - __main__ - Step 11998: {'lr': 0.0004943921633044644, 'samples': 2303616, 'steps': 11997, 'loss/train': 1.752882480621338} +11/06/2021 22:54:27 - INFO - __main__ - Step 11999: {'lr': 0.0004943910455587354, 'samples': 2303808, 'steps': 11998, 'loss/train': 1.246006727218628} +11/06/2021 22:54:28 - INFO - __main__ - Step 12000: {'lr': 0.0004943899277028877, 'samples': 2304000, 'steps': 11999, 'loss/train': 1.6304447650909424} +11/06/2021 22:54:29 - INFO - __main__ - Step 12001: {'lr': 0.0004943888097369216, 'samples': 2304192, 'steps': 12000, 'loss/train': 1.6695126295089722} +11/06/2021 22:54:29 - INFO - __main__ - Step 12002: {'lr': 0.0004943876916608375, 'samples': 2304384, 'steps': 12001, 'loss/train': 1.794386625289917} +11/06/2021 22:54:29 - INFO - __main__ - Step 12003: {'lr': 0.0004943865734746364, 'samples': 2304576, 'steps': 12002, 'loss/train': 1.8876904249191284} +11/06/2021 22:54:30 - INFO - __main__ - Step 12004: {'lr': 0.0004943854551783182, 'samples': 2304768, 'steps': 12003, 'loss/train': 1.6697297096252441} +11/06/2021 22:54:31 - INFO - __main__ - Step 12005: {'lr': 0.0004943843367718838, 'samples': 2304960, 'steps': 12004, 'loss/train': 1.6420907974243164} +11/06/2021 22:54:31 - INFO - __main__ - Step 12006: {'lr': 0.0004943832182553336, 'samples': 2305152, 'steps': 12005, 'loss/train': 1.553113341331482} +11/06/2021 22:54:32 - INFO - __main__ - Step 12007: {'lr': 0.000494382099628668, 'samples': 2305344, 'steps': 12006, 'loss/train': 2.0208699703216553} +11/06/2021 22:54:32 - INFO - __main__ - Step 12008: {'lr': 0.0004943809808918877, 'samples': 2305536, 'steps': 12007, 'loss/train': 1.575126051902771} +11/06/2021 22:54:32 - INFO - __main__ - Step 12009: {'lr': 0.000494379862044993, 'samples': 2305728, 'steps': 12008, 'loss/train': 1.9213340282440186} +11/06/2021 22:54:33 - INFO - __main__ - Step 12010: {'lr': 0.0004943787430879846, 'samples': 2305920, 'steps': 12009, 'loss/train': 1.99528169631958} +11/06/2021 22:54:34 - INFO - __main__ - Step 12011: {'lr': 0.0004943776240208628, 'samples': 2306112, 'steps': 12010, 'loss/train': 1.7493822574615479} +11/06/2021 22:54:34 - INFO - __main__ - Step 12012: {'lr': 0.0004943765048436283, 'samples': 2306304, 'steps': 12011, 'loss/train': 1.5333633422851562} +11/06/2021 22:54:34 - INFO - __main__ - Step 12013: {'lr': 0.0004943753855562815, 'samples': 2306496, 'steps': 12012, 'loss/train': 1.6219375133514404} +11/06/2021 22:54:35 - INFO - __main__ - Step 12014: {'lr': 0.000494374266158823, 'samples': 2306688, 'steps': 12013, 'loss/train': 1.9051744937896729} +11/06/2021 22:54:36 - INFO - __main__ - Step 12015: {'lr': 0.0004943731466512531, 'samples': 2306880, 'steps': 12014, 'loss/train': 1.5404677391052246} +11/06/2021 22:54:37 - INFO - __main__ - Step 12016: {'lr': 0.0004943720270335724, 'samples': 2307072, 'steps': 12015, 'loss/train': 1.5498056411743164} +11/06/2021 22:54:37 - INFO - __main__ - Step 12017: {'lr': 0.0004943709073057816, 'samples': 2307264, 'steps': 12016, 'loss/train': 1.53780198097229} +11/06/2021 22:54:37 - INFO - __main__ - Step 12018: {'lr': 0.000494369787467881, 'samples': 2307456, 'steps': 12017, 'loss/train': 1.328963041305542} +11/06/2021 22:54:38 - INFO - __main__ - Step 12019: {'lr': 0.000494368667519871, 'samples': 2307648, 'steps': 12018, 'loss/train': 1.014737844467163} +11/06/2021 22:54:38 - INFO - __main__ - Step 12020: {'lr': 0.0004943675474617524, 'samples': 2307840, 'steps': 12019, 'loss/train': 1.956551432609558} +11/06/2021 22:54:39 - INFO - __main__ - Step 12021: {'lr': 0.0004943664272935255, 'samples': 2308032, 'steps': 12020, 'loss/train': 1.9309561252593994} +11/06/2021 22:54:39 - INFO - __main__ - Step 12022: {'lr': 0.0004943653070151909, 'samples': 2308224, 'steps': 12021, 'loss/train': 1.6873791217803955} +11/06/2021 22:54:40 - INFO - __main__ - Step 12023: {'lr': 0.000494364186626749, 'samples': 2308416, 'steps': 12022, 'loss/train': 0.8956676125526428} +11/06/2021 22:54:40 - INFO - __main__ - Step 12024: {'lr': 0.0004943630661282004, 'samples': 2308608, 'steps': 12023, 'loss/train': 1.492911696434021} +11/06/2021 22:54:40 - INFO - __main__ - Step 12025: {'lr': 0.0004943619455195456, 'samples': 2308800, 'steps': 12024, 'loss/train': 2.243229627609253} +11/06/2021 22:54:41 - INFO - __main__ - Step 12026: {'lr': 0.000494360824800785, 'samples': 2308992, 'steps': 12025, 'loss/train': 2.4765336513519287} +11/06/2021 22:54:42 - INFO - __main__ - Step 12027: {'lr': 0.0004943597039719192, 'samples': 2309184, 'steps': 12026, 'loss/train': 2.0413081645965576} +11/06/2021 22:54:42 - INFO - __main__ - Step 12028: {'lr': 0.0004943585830329487, 'samples': 2309376, 'steps': 12027, 'loss/train': 1.6951693296432495} +11/06/2021 22:54:42 - INFO - __main__ - Step 12029: {'lr': 0.0004943574619838741, 'samples': 2309568, 'steps': 12028, 'loss/train': 1.7877787351608276} +11/06/2021 22:54:43 - INFO - __main__ - Step 12030: {'lr': 0.0004943563408246957, 'samples': 2309760, 'steps': 12029, 'loss/train': 2.547342300415039} +11/06/2021 22:54:44 - INFO - __main__ - Step 12031: {'lr': 0.000494355219555414, 'samples': 2309952, 'steps': 12030, 'loss/train': 1.9224157333374023} +11/06/2021 22:54:44 - INFO - __main__ - Step 12032: {'lr': 0.0004943540981760298, 'samples': 2310144, 'steps': 12031, 'loss/train': 1.732265591621399} +11/06/2021 22:54:45 - INFO - __main__ - Step 12033: {'lr': 0.0004943529766865434, 'samples': 2310336, 'steps': 12032, 'loss/train': 1.4456995725631714} +11/06/2021 22:54:45 - INFO - __main__ - Step 12034: {'lr': 0.0004943518550869552, 'samples': 2310528, 'steps': 12033, 'loss/train': 1.0278202295303345} +11/06/2021 22:54:45 - INFO - __main__ - Step 12035: {'lr': 0.0004943507333772659, 'samples': 2310720, 'steps': 12034, 'loss/train': 1.7194404602050781} +11/06/2021 22:54:46 - INFO - __main__ - Step 12036: {'lr': 0.0004943496115574758, 'samples': 2310912, 'steps': 12035, 'loss/train': 1.838610053062439} +11/06/2021 22:54:47 - INFO - __main__ - Step 12037: {'lr': 0.0004943484896275857, 'samples': 2311104, 'steps': 12036, 'loss/train': 1.8748886585235596} +11/06/2021 22:54:47 - INFO - __main__ - Step 12038: {'lr': 0.0004943473675875959, 'samples': 2311296, 'steps': 12037, 'loss/train': 1.785986304283142} +11/06/2021 22:54:47 - INFO - __main__ - Step 12039: {'lr': 0.0004943462454375069, 'samples': 2311488, 'steps': 12038, 'loss/train': 1.6484863758087158} +11/06/2021 22:54:48 - INFO - __main__ - Step 12040: {'lr': 0.0004943451231773192, 'samples': 2311680, 'steps': 12039, 'loss/train': 1.8287440538406372} +11/06/2021 22:54:48 - INFO - __main__ - Step 12041: {'lr': 0.0004943440008070336, 'samples': 2311872, 'steps': 12040, 'loss/train': 1.2634427547454834} +11/06/2021 22:54:49 - INFO - __main__ - Step 12042: {'lr': 0.0004943428783266502, 'samples': 2312064, 'steps': 12041, 'loss/train': 1.7805235385894775} +11/06/2021 22:54:49 - INFO - __main__ - Step 12043: {'lr': 0.0004943417557361696, 'samples': 2312256, 'steps': 12042, 'loss/train': 1.758927583694458} +11/06/2021 22:54:50 - INFO - __main__ - Step 12044: {'lr': 0.0004943406330355925, 'samples': 2312448, 'steps': 12043, 'loss/train': 1.159117341041565} +11/06/2021 22:54:50 - INFO - __main__ - Step 12045: {'lr': 0.0004943395102249192, 'samples': 2312640, 'steps': 12044, 'loss/train': 1.8468574285507202} +11/06/2021 22:54:51 - INFO - __main__ - Step 12046: {'lr': 0.0004943383873041503, 'samples': 2312832, 'steps': 12045, 'loss/train': 1.8814785480499268} +11/06/2021 22:54:51 - INFO - __main__ - Step 12047: {'lr': 0.0004943372642732864, 'samples': 2313024, 'steps': 12046, 'loss/train': 2.093292236328125} +11/06/2021 22:54:52 - INFO - __main__ - Step 12048: {'lr': 0.0004943361411323277, 'samples': 2313216, 'steps': 12047, 'loss/train': 1.5713038444519043} +11/06/2021 22:54:52 - INFO - __main__ - Step 12049: {'lr': 0.0004943350178812751, 'samples': 2313408, 'steps': 12048, 'loss/train': 1.8695523738861084} +11/06/2021 22:54:52 - INFO - __main__ - Step 12050: {'lr': 0.0004943338945201288, 'samples': 2313600, 'steps': 12049, 'loss/train': 1.4861245155334473} +11/06/2021 22:54:53 - INFO - __main__ - Step 12051: {'lr': 0.0004943327710488894, 'samples': 2313792, 'steps': 12050, 'loss/train': 1.4577797651290894} +11/06/2021 22:54:54 - INFO - __main__ - Step 12052: {'lr': 0.0004943316474675575, 'samples': 2313984, 'steps': 12051, 'loss/train': 1.26167631149292} +11/06/2021 22:54:54 - INFO - __main__ - Step 12053: {'lr': 0.0004943305237761335, 'samples': 2314176, 'steps': 12052, 'loss/train': 1.674010157585144} +11/06/2021 22:54:54 - INFO - __main__ - Step 12054: {'lr': 0.0004943293999746179, 'samples': 2314368, 'steps': 12053, 'loss/train': 1.585003137588501} +11/06/2021 22:54:55 - INFO - __main__ - Step 12055: {'lr': 0.0004943282760630114, 'samples': 2314560, 'steps': 12054, 'loss/train': 1.8338981866836548} +11/06/2021 22:54:56 - INFO - __main__ - Step 12056: {'lr': 0.0004943271520413141, 'samples': 2314752, 'steps': 12055, 'loss/train': 1.6926106214523315} +11/06/2021 22:54:56 - INFO - __main__ - Step 12057: {'lr': 0.0004943260279095269, 'samples': 2314944, 'steps': 12056, 'loss/train': 1.6934748888015747} +11/06/2021 22:54:57 - INFO - __main__ - Step 12058: {'lr': 0.0004943249036676501, 'samples': 2315136, 'steps': 12057, 'loss/train': 1.7814065217971802} +11/06/2021 22:54:57 - INFO - __main__ - Step 12059: {'lr': 0.0004943237793156844, 'samples': 2315328, 'steps': 12058, 'loss/train': 2.4570651054382324} +11/06/2021 22:54:57 - INFO - __main__ - Step 12060: {'lr': 0.00049432265485363, 'samples': 2315520, 'steps': 12059, 'loss/train': 1.1607862710952759} +11/06/2021 22:54:58 - INFO - __main__ - Step 12061: {'lr': 0.0004943215302814877, 'samples': 2315712, 'steps': 12060, 'loss/train': 1.2177666425704956} +11/06/2021 22:54:59 - INFO - __main__ - Step 12062: {'lr': 0.0004943204055992579, 'samples': 2315904, 'steps': 12061, 'loss/train': 1.5392464399337769} +11/06/2021 22:54:59 - INFO - __main__ - Step 12063: {'lr': 0.0004943192808069411, 'samples': 2316096, 'steps': 12062, 'loss/train': 1.2292014360427856} +11/06/2021 22:54:59 - INFO - __main__ - Step 12064: {'lr': 0.0004943181559045378, 'samples': 2316288, 'steps': 12063, 'loss/train': 1.9744259119033813} +11/06/2021 22:55:00 - INFO - __main__ - Step 12065: {'lr': 0.0004943170308920483, 'samples': 2316480, 'steps': 12064, 'loss/train': 1.6766237020492554} +11/06/2021 22:55:00 - INFO - __main__ - Step 12066: {'lr': 0.0004943159057694736, 'samples': 2316672, 'steps': 12065, 'loss/train': 1.6280395984649658} +11/06/2021 22:55:02 - INFO - __main__ - Step 12067: {'lr': 0.0004943147805368138, 'samples': 2316864, 'steps': 12066, 'loss/train': 1.6543623208999634} +11/06/2021 22:55:02 - INFO - __main__ - Step 12068: {'lr': 0.0004943136551940695, 'samples': 2317056, 'steps': 12067, 'loss/train': 1.1795415878295898} +11/06/2021 22:55:02 - INFO - __main__ - Step 12069: {'lr': 0.0004943125297412413, 'samples': 2317248, 'steps': 12068, 'loss/train': 1.8180369138717651} +11/06/2021 22:55:03 - INFO - __main__ - Step 12070: {'lr': 0.0004943114041783296, 'samples': 2317440, 'steps': 12069, 'loss/train': 1.788710355758667} +11/06/2021 22:55:03 - INFO - __main__ - Step 12071: {'lr': 0.000494310278505335, 'samples': 2317632, 'steps': 12070, 'loss/train': 1.761925458908081} +11/06/2021 22:55:03 - INFO - __main__ - Step 12072: {'lr': 0.0004943091527222579, 'samples': 2317824, 'steps': 12071, 'loss/train': 1.7475976943969727} +11/06/2021 22:55:04 - INFO - __main__ - Step 12073: {'lr': 0.0004943080268290989, 'samples': 2318016, 'steps': 12072, 'loss/train': 1.6183298826217651} +11/06/2021 22:55:05 - INFO - __main__ - Step 12074: {'lr': 0.0004943069008258584, 'samples': 2318208, 'steps': 12073, 'loss/train': 1.4593292474746704} +11/06/2021 22:55:05 - INFO - __main__ - Step 12075: {'lr': 0.0004943057747125371, 'samples': 2318400, 'steps': 12074, 'loss/train': 1.8841195106506348} +11/06/2021 22:55:06 - INFO - __main__ - Step 12076: {'lr': 0.0004943046484891352, 'samples': 2318592, 'steps': 12075, 'loss/train': 1.3961201906204224} +11/06/2021 22:55:06 - INFO - __main__ - Step 12077: {'lr': 0.0004943035221556536, 'samples': 2318784, 'steps': 12076, 'loss/train': 1.4814202785491943} +11/06/2021 22:55:07 - INFO - __main__ - Step 12078: {'lr': 0.0004943023957120926, 'samples': 2318976, 'steps': 12077, 'loss/train': 1.8115047216415405} +11/06/2021 22:55:07 - INFO - __main__ - Step 12079: {'lr': 0.0004943012691584526, 'samples': 2319168, 'steps': 12078, 'loss/train': 1.6468000411987305} +11/06/2021 22:55:08 - INFO - __main__ - Step 12080: {'lr': 0.0004943001424947343, 'samples': 2319360, 'steps': 12079, 'loss/train': 2.1361162662506104} +11/06/2021 22:55:08 - INFO - __main__ - Step 12081: {'lr': 0.000494299015720938, 'samples': 2319552, 'steps': 12080, 'loss/train': 1.2885714769363403} +11/06/2021 22:55:08 - INFO - __main__ - Step 12082: {'lr': 0.0004942978888370645, 'samples': 2319744, 'steps': 12081, 'loss/train': 2.0774118900299072} +11/06/2021 22:55:10 - INFO - __main__ - Step 12083: {'lr': 0.000494296761843114, 'samples': 2319936, 'steps': 12082, 'loss/train': 1.5701794624328613} +11/06/2021 22:55:10 - INFO - __main__ - Step 12084: {'lr': 0.0004942956347390872, 'samples': 2320128, 'steps': 12083, 'loss/train': 1.1753841638565063} +11/06/2021 22:55:11 - INFO - __main__ - Step 12085: {'lr': 0.0004942945075249845, 'samples': 2320320, 'steps': 12084, 'loss/train': 1.6543172597885132} +11/06/2021 22:55:11 - INFO - __main__ - Step 12086: {'lr': 0.0004942933802008066, 'samples': 2320512, 'steps': 12085, 'loss/train': 2.0663843154907227} +11/06/2021 22:55:12 - INFO - __main__ - Step 12087: {'lr': 0.0004942922527665538, 'samples': 2320704, 'steps': 12086, 'loss/train': 1.5923895835876465} +11/06/2021 22:55:12 - INFO - __main__ - Step 12088: {'lr': 0.0004942911252222267, 'samples': 2320896, 'steps': 12087, 'loss/train': 0.7742838263511658} +11/06/2021 22:55:12 - INFO - __main__ - Step 12089: {'lr': 0.0004942899975678257, 'samples': 2321088, 'steps': 12088, 'loss/train': 1.9447110891342163} +11/06/2021 22:55:13 - INFO - __main__ - Step 12090: {'lr': 0.0004942888698033515, 'samples': 2321280, 'steps': 12089, 'loss/train': 1.889116883277893} +11/06/2021 22:55:14 - INFO - __main__ - Step 12091: {'lr': 0.0004942877419288045, 'samples': 2321472, 'steps': 12090, 'loss/train': 1.8266593217849731} +11/06/2021 22:55:14 - INFO - __main__ - Step 12092: {'lr': 0.0004942866139441851, 'samples': 2321664, 'steps': 12091, 'loss/train': 1.2201491594314575} +11/06/2021 22:55:14 - INFO - __main__ - Step 12093: {'lr': 0.0004942854858494941, 'samples': 2321856, 'steps': 12092, 'loss/train': 1.8048791885375977} +11/06/2021 22:55:15 - INFO - __main__ - Step 12094: {'lr': 0.0004942843576447316, 'samples': 2322048, 'steps': 12093, 'loss/train': 1.6451750993728638} +11/06/2021 22:55:15 - INFO - __main__ - Step 12095: {'lr': 0.0004942832293298986, 'samples': 2322240, 'steps': 12094, 'loss/train': 1.459704041481018} +11/06/2021 22:55:16 - INFO - __main__ - Step 12096: {'lr': 0.0004942821009049952, 'samples': 2322432, 'steps': 12095, 'loss/train': 2.0811355113983154} +11/06/2021 22:55:16 - INFO - __main__ - Step 12097: {'lr': 0.0004942809723700221, 'samples': 2322624, 'steps': 12096, 'loss/train': 1.5584614276885986} +11/06/2021 22:55:17 - INFO - __main__ - Step 12098: {'lr': 0.0004942798437249797, 'samples': 2322816, 'steps': 12097, 'loss/train': 1.5112113952636719} +11/06/2021 22:55:17 - INFO - __main__ - Step 12099: {'lr': 0.0004942787149698687, 'samples': 2323008, 'steps': 12098, 'loss/train': 1.9871211051940918} +11/06/2021 22:55:17 - INFO - __main__ - Step 12100: {'lr': 0.0004942775861046893, 'samples': 2323200, 'steps': 12099, 'loss/train': 2.562870740890503} +11/06/2021 22:55:18 - INFO - __main__ - Step 12101: {'lr': 0.0004942764571294422, 'samples': 2323392, 'steps': 12100, 'loss/train': 1.39982008934021} +11/06/2021 22:55:19 - INFO - __main__ - Step 12102: {'lr': 0.0004942753280441281, 'samples': 2323584, 'steps': 12101, 'loss/train': 2.016968250274658} +11/06/2021 22:55:19 - INFO - __main__ - Step 12103: {'lr': 0.0004942741988487471, 'samples': 2323776, 'steps': 12102, 'loss/train': 1.8526740074157715} +11/06/2021 22:55:19 - INFO - __main__ - Step 12104: {'lr': 0.0004942730695433001, 'samples': 2323968, 'steps': 12103, 'loss/train': 1.4173227548599243} +11/06/2021 22:55:20 - INFO - __main__ - Step 12105: {'lr': 0.0004942719401277873, 'samples': 2324160, 'steps': 12104, 'loss/train': 1.0924817323684692} +11/06/2021 22:55:21 - INFO - __main__ - Step 12106: {'lr': 0.0004942708106022094, 'samples': 2324352, 'steps': 12105, 'loss/train': 1.5277026891708374} +11/06/2021 22:55:21 - INFO - __main__ - Step 12107: {'lr': 0.0004942696809665668, 'samples': 2324544, 'steps': 12106, 'loss/train': 1.9903008937835693} +11/06/2021 22:55:21 - INFO - __main__ - Step 12108: {'lr': 0.0004942685512208599, 'samples': 2324736, 'steps': 12107, 'loss/train': 1.1875405311584473} +11/06/2021 22:55:22 - INFO - __main__ - Step 12109: {'lr': 0.0004942674213650896, 'samples': 2324928, 'steps': 12108, 'loss/train': 1.4761584997177124} +11/06/2021 22:55:22 - INFO - __main__ - Step 12110: {'lr': 0.000494266291399256, 'samples': 2325120, 'steps': 12109, 'loss/train': 1.6016489267349243} +11/06/2021 22:55:23 - INFO - __main__ - Step 12111: {'lr': 0.0004942651613233599, 'samples': 2325312, 'steps': 12110, 'loss/train': 1.8227951526641846} +11/06/2021 22:55:24 - INFO - __main__ - Step 12112: {'lr': 0.0004942640311374017, 'samples': 2325504, 'steps': 12111, 'loss/train': 1.8934657573699951} +11/06/2021 22:55:24 - INFO - __main__ - Step 12113: {'lr': 0.0004942629008413818, 'samples': 2325696, 'steps': 12112, 'loss/train': 1.4961217641830444} +11/06/2021 22:55:24 - INFO - __main__ - Step 12114: {'lr': 0.0004942617704353008, 'samples': 2325888, 'steps': 12113, 'loss/train': 1.5559004545211792} +11/06/2021 22:55:25 - INFO - __main__ - Step 12115: {'lr': 0.0004942606399191593, 'samples': 2326080, 'steps': 12114, 'loss/train': 1.4733009338378906} +11/06/2021 22:55:25 - INFO - __main__ - Step 12116: {'lr': 0.0004942595092929577, 'samples': 2326272, 'steps': 12115, 'loss/train': 1.756181240081787} +11/06/2021 22:55:27 - INFO - __main__ - Step 12117: {'lr': 0.0004942583785566965, 'samples': 2326464, 'steps': 12116, 'loss/train': 1.810673475265503} +11/06/2021 22:55:27 - INFO - __main__ - Step 12118: {'lr': 0.0004942572477103763, 'samples': 2326656, 'steps': 12117, 'loss/train': 1.341216802597046} +11/06/2021 22:55:27 - INFO - __main__ - Step 12119: {'lr': 0.0004942561167539975, 'samples': 2326848, 'steps': 12118, 'loss/train': 1.2394644021987915} +11/06/2021 22:55:28 - INFO - __main__ - Step 12120: {'lr': 0.0004942549856875606, 'samples': 2327040, 'steps': 12119, 'loss/train': 1.7882914543151855} +11/06/2021 22:55:28 - INFO - __main__ - Step 12121: {'lr': 0.0004942538545110663, 'samples': 2327232, 'steps': 12120, 'loss/train': 1.967432975769043} +11/06/2021 22:55:29 - INFO - __main__ - Step 12122: {'lr': 0.0004942527232245149, 'samples': 2327424, 'steps': 12121, 'loss/train': 2.7210159301757812} +11/06/2021 22:55:30 - INFO - __main__ - Step 12123: {'lr': 0.0004942515918279071, 'samples': 2327616, 'steps': 12122, 'loss/train': 1.1575158834457397} +11/06/2021 22:55:30 - INFO - __main__ - Step 12124: {'lr': 0.0004942504603212433, 'samples': 2327808, 'steps': 12123, 'loss/train': 1.8473913669586182} +11/06/2021 22:55:30 - INFO - __main__ - Step 12125: {'lr': 0.0004942493287045239, 'samples': 2328000, 'steps': 12124, 'loss/train': 1.3073318004608154} +11/06/2021 22:55:31 - INFO - __main__ - Step 12126: {'lr': 0.0004942481969777495, 'samples': 2328192, 'steps': 12125, 'loss/train': 2.258380889892578} +11/06/2021 22:55:31 - INFO - __main__ - Step 12127: {'lr': 0.0004942470651409207, 'samples': 2328384, 'steps': 12126, 'loss/train': 1.8729878664016724} +11/06/2021 22:55:32 - INFO - __main__ - Step 12128: {'lr': 0.000494245933194038, 'samples': 2328576, 'steps': 12127, 'loss/train': 1.1568888425827026} +11/06/2021 22:55:33 - INFO - __main__ - Step 12129: {'lr': 0.0004942448011371018, 'samples': 2328768, 'steps': 12128, 'loss/train': 1.8721987009048462} +11/06/2021 22:55:33 - INFO - __main__ - Step 12130: {'lr': 0.0004942436689701126, 'samples': 2328960, 'steps': 12129, 'loss/train': 1.7959274053573608} +11/06/2021 22:55:33 - INFO - __main__ - Step 12131: {'lr': 0.000494242536693071, 'samples': 2329152, 'steps': 12130, 'loss/train': 1.718927264213562} +11/06/2021 22:55:34 - INFO - __main__ - Step 12132: {'lr': 0.0004942414043059776, 'samples': 2329344, 'steps': 12131, 'loss/train': 1.8697373867034912} +11/06/2021 22:55:35 - INFO - __main__ - Step 12133: {'lr': 0.0004942402718088326, 'samples': 2329536, 'steps': 12132, 'loss/train': 1.8126624822616577} +11/06/2021 22:55:35 - INFO - __main__ - Step 12134: {'lr': 0.0004942391392016368, 'samples': 2329728, 'steps': 12133, 'loss/train': 1.6488497257232666} +11/06/2021 22:55:35 - INFO - __main__ - Step 12135: {'lr': 0.0004942380064843906, 'samples': 2329920, 'steps': 12134, 'loss/train': 1.8256616592407227} +11/06/2021 22:55:36 - INFO - __main__ - Step 12136: {'lr': 0.0004942368736570946, 'samples': 2330112, 'steps': 12135, 'loss/train': 1.4627264738082886} +11/06/2021 22:55:36 - INFO - __main__ - Step 12137: {'lr': 0.0004942357407197491, 'samples': 2330304, 'steps': 12136, 'loss/train': 1.6289029121398926} +11/06/2021 22:55:37 - INFO - __main__ - Step 12138: {'lr': 0.0004942346076723548, 'samples': 2330496, 'steps': 12137, 'loss/train': 1.9620447158813477} +11/06/2021 22:55:38 - INFO - __main__ - Step 12139: {'lr': 0.0004942334745149122, 'samples': 2330688, 'steps': 12138, 'loss/train': 2.0332870483398438} +11/06/2021 22:55:38 - INFO - __main__ - Step 12140: {'lr': 0.0004942323412474218, 'samples': 2330880, 'steps': 12139, 'loss/train': 1.301571249961853} +11/06/2021 22:55:38 - INFO - __main__ - Step 12141: {'lr': 0.000494231207869884, 'samples': 2331072, 'steps': 12140, 'loss/train': 1.325974941253662} +11/06/2021 22:55:39 - INFO - __main__ - Step 12142: {'lr': 0.0004942300743822993, 'samples': 2331264, 'steps': 12141, 'loss/train': 1.419464111328125} +11/06/2021 22:55:40 - INFO - __main__ - Step 12143: {'lr': 0.0004942289407846684, 'samples': 2331456, 'steps': 12142, 'loss/train': 0.5399057865142822} +11/06/2021 22:55:40 - INFO - __main__ - Step 12144: {'lr': 0.0004942278070769917, 'samples': 2331648, 'steps': 12143, 'loss/train': 1.7828236818313599} +11/06/2021 22:55:40 - INFO - __main__ - Step 12145: {'lr': 0.0004942266732592697, 'samples': 2331840, 'steps': 12144, 'loss/train': 1.8341064453125} +11/06/2021 22:55:41 - INFO - __main__ - Step 12146: {'lr': 0.0004942255393315029, 'samples': 2332032, 'steps': 12145, 'loss/train': 1.1581087112426758} +11/06/2021 22:55:41 - INFO - __main__ - Step 12147: {'lr': 0.000494224405293692, 'samples': 2332224, 'steps': 12146, 'loss/train': 1.870377779006958} +11/06/2021 22:55:41 - INFO - __main__ - Step 12148: {'lr': 0.0004942232711458372, 'samples': 2332416, 'steps': 12147, 'loss/train': 1.5845227241516113} +11/06/2021 22:55:42 - INFO - __main__ - Step 12149: {'lr': 0.0004942221368879391, 'samples': 2332608, 'steps': 12148, 'loss/train': 1.2885611057281494} +11/06/2021 22:55:43 - INFO - __main__ - Step 12150: {'lr': 0.0004942210025199985, 'samples': 2332800, 'steps': 12149, 'loss/train': 1.941924810409546} +11/06/2021 22:55:43 - INFO - __main__ - Step 12151: {'lr': 0.0004942198680420155, 'samples': 2332992, 'steps': 12150, 'loss/train': 1.2128046751022339} +11/06/2021 22:55:43 - INFO - __main__ - Step 12152: {'lr': 0.0004942187334539908, 'samples': 2333184, 'steps': 12151, 'loss/train': 1.949316382408142} +11/06/2021 22:55:44 - INFO - __main__ - Step 12153: {'lr': 0.0004942175987559251, 'samples': 2333376, 'steps': 12152, 'loss/train': 3.1983020305633545} +11/06/2021 22:55:45 - INFO - __main__ - Step 12154: {'lr': 0.0004942164639478185, 'samples': 2333568, 'steps': 12153, 'loss/train': 2.0099000930786133} +11/06/2021 22:55:45 - INFO - __main__ - Step 12155: {'lr': 0.0004942153290296718, 'samples': 2333760, 'steps': 12154, 'loss/train': 2.0011119842529297} +11/06/2021 22:55:45 - INFO - __main__ - Step 12156: {'lr': 0.0004942141940014854, 'samples': 2333952, 'steps': 12155, 'loss/train': 1.7409350872039795} +11/06/2021 22:55:46 - INFO - __main__ - Step 12157: {'lr': 0.0004942130588632599, 'samples': 2334144, 'steps': 12156, 'loss/train': 2.0252602100372314} +11/06/2021 22:55:46 - INFO - __main__ - Step 12158: {'lr': 0.0004942119236149958, 'samples': 2334336, 'steps': 12157, 'loss/train': 1.6826229095458984} +11/06/2021 22:55:47 - INFO - __main__ - Step 12159: {'lr': 0.0004942107882566936, 'samples': 2334528, 'steps': 12158, 'loss/train': 1.7889363765716553} +11/06/2021 22:55:47 - INFO - __main__ - Step 12160: {'lr': 0.0004942096527883538, 'samples': 2334720, 'steps': 12159, 'loss/train': 1.4643501043319702} +11/06/2021 22:55:48 - INFO - __main__ - Step 12161: {'lr': 0.0004942085172099768, 'samples': 2334912, 'steps': 12160, 'loss/train': 1.5718570947647095} +11/06/2021 22:55:48 - INFO - __main__ - Step 12162: {'lr': 0.0004942073815215632, 'samples': 2335104, 'steps': 12161, 'loss/train': 1.6668059825897217} +11/06/2021 22:55:49 - INFO - __main__ - Step 12163: {'lr': 0.0004942062457231136, 'samples': 2335296, 'steps': 12162, 'loss/train': 1.9814776182174683} +11/06/2021 22:55:50 - INFO - __main__ - Step 12164: {'lr': 0.0004942051098146284, 'samples': 2335488, 'steps': 12163, 'loss/train': 1.9286428689956665} +11/06/2021 22:55:50 - INFO - __main__ - Step 12165: {'lr': 0.0004942039737961081, 'samples': 2335680, 'steps': 12164, 'loss/train': 1.8754050731658936} +11/06/2021 22:55:50 - INFO - __main__ - Step 12166: {'lr': 0.0004942028376675533, 'samples': 2335872, 'steps': 12165, 'loss/train': 1.3288780450820923} +11/06/2021 22:55:51 - INFO - __main__ - Step 12167: {'lr': 0.0004942017014289645, 'samples': 2336064, 'steps': 12166, 'loss/train': 1.694525957107544} +11/06/2021 22:55:51 - INFO - __main__ - Step 12168: {'lr': 0.0004942005650803421, 'samples': 2336256, 'steps': 12167, 'loss/train': 1.5838422775268555} +11/06/2021 22:55:51 - INFO - __main__ - Step 12169: {'lr': 0.0004941994286216867, 'samples': 2336448, 'steps': 12168, 'loss/train': 1.7149986028671265} +11/06/2021 22:55:52 - INFO - __main__ - Step 12170: {'lr': 0.0004941982920529989, 'samples': 2336640, 'steps': 12169, 'loss/train': 1.529640793800354} +11/06/2021 22:55:53 - INFO - __main__ - Step 12171: {'lr': 0.0004941971553742791, 'samples': 2336832, 'steps': 12170, 'loss/train': 1.0539520978927612} +11/06/2021 22:55:53 - INFO - __main__ - Step 12172: {'lr': 0.0004941960185855278, 'samples': 2337024, 'steps': 12171, 'loss/train': 2.0904853343963623} +11/06/2021 22:55:53 - INFO - __main__ - Step 12173: {'lr': 0.0004941948816867455, 'samples': 2337216, 'steps': 12172, 'loss/train': 1.5987201929092407} +11/06/2021 22:55:54 - INFO - __main__ - Step 12174: {'lr': 0.0004941937446779328, 'samples': 2337408, 'steps': 12173, 'loss/train': 1.9558372497558594} +11/06/2021 22:55:55 - INFO - __main__ - Step 12175: {'lr': 0.0004941926075590901, 'samples': 2337600, 'steps': 12174, 'loss/train': 1.9326342344284058} +11/06/2021 22:55:55 - INFO - __main__ - Step 12176: {'lr': 0.0004941914703302181, 'samples': 2337792, 'steps': 12175, 'loss/train': 1.5912054777145386} +11/06/2021 22:55:55 - INFO - __main__ - Step 12177: {'lr': 0.0004941903329913172, 'samples': 2337984, 'steps': 12176, 'loss/train': 1.657957911491394} +11/06/2021 22:55:56 - INFO - __main__ - Step 12178: {'lr': 0.0004941891955423878, 'samples': 2338176, 'steps': 12177, 'loss/train': 2.281742811203003} +11/06/2021 22:55:56 - INFO - __main__ - Step 12179: {'lr': 0.0004941880579834306, 'samples': 2338368, 'steps': 12178, 'loss/train': 1.9655019044876099} +11/06/2021 22:55:57 - INFO - __main__ - Step 12180: {'lr': 0.0004941869203144459, 'samples': 2338560, 'steps': 12179, 'loss/train': 0.7616149187088013} +11/06/2021 22:55:58 - INFO - __main__ - Step 12181: {'lr': 0.0004941857825354344, 'samples': 2338752, 'steps': 12180, 'loss/train': 1.607176423072815} +11/06/2021 22:55:58 - INFO - __main__ - Step 12182: {'lr': 0.0004941846446463966, 'samples': 2338944, 'steps': 12181, 'loss/train': 1.9033536911010742} +11/06/2021 22:55:58 - INFO - __main__ - Step 12183: {'lr': 0.000494183506647333, 'samples': 2339136, 'steps': 12182, 'loss/train': 1.972430944442749} +11/06/2021 22:55:59 - INFO - __main__ - Step 12184: {'lr': 0.000494182368538244, 'samples': 2339328, 'steps': 12183, 'loss/train': 1.4964816570281982} +11/06/2021 22:56:00 - INFO - __main__ - Step 12185: {'lr': 0.0004941812303191302, 'samples': 2339520, 'steps': 12184, 'loss/train': 1.8058403730392456} +11/06/2021 22:56:00 - INFO - __main__ - Step 12186: {'lr': 0.0004941800919899921, 'samples': 2339712, 'steps': 12185, 'loss/train': 1.9677493572235107} +11/06/2021 22:56:00 - INFO - __main__ - Step 12187: {'lr': 0.0004941789535508303, 'samples': 2339904, 'steps': 12186, 'loss/train': 1.774878978729248} +11/06/2021 22:56:01 - INFO - __main__ - Step 12188: {'lr': 0.0004941778150016451, 'samples': 2340096, 'steps': 12187, 'loss/train': 1.5408471822738647} +11/06/2021 22:56:01 - INFO - __main__ - Step 12189: {'lr': 0.0004941766763424373, 'samples': 2340288, 'steps': 12188, 'loss/train': 1.433286190032959} +11/06/2021 22:56:02 - INFO - __main__ - Step 12190: {'lr': 0.0004941755375732071, 'samples': 2340480, 'steps': 12189, 'loss/train': 1.7328075170516968} +11/06/2021 22:56:02 - INFO - __main__ - Step 12191: {'lr': 0.0004941743986939553, 'samples': 2340672, 'steps': 12190, 'loss/train': 1.647670030593872} +11/06/2021 22:56:03 - INFO - __main__ - Step 12192: {'lr': 0.0004941732597046822, 'samples': 2340864, 'steps': 12191, 'loss/train': 1.4415473937988281} +11/06/2021 22:56:03 - INFO - __main__ - Step 12193: {'lr': 0.0004941721206053885, 'samples': 2341056, 'steps': 12192, 'loss/train': 3.6256818771362305} +11/06/2021 22:56:04 - INFO - __main__ - Step 12194: {'lr': 0.0004941709813960745, 'samples': 2341248, 'steps': 12193, 'loss/train': 1.5252056121826172} +11/06/2021 22:56:05 - INFO - __main__ - Step 12195: {'lr': 0.0004941698420767408, 'samples': 2341440, 'steps': 12194, 'loss/train': 1.3925776481628418} +11/06/2021 22:56:05 - INFO - __main__ - Step 12196: {'lr': 0.0004941687026473881, 'samples': 2341632, 'steps': 12195, 'loss/train': 0.3151058852672577} +11/06/2021 22:56:05 - INFO - __main__ - Step 12197: {'lr': 0.0004941675631080166, 'samples': 2341824, 'steps': 12196, 'loss/train': 2.0778465270996094} +11/06/2021 22:56:06 - INFO - __main__ - Step 12198: {'lr': 0.000494166423458627, 'samples': 2342016, 'steps': 12197, 'loss/train': 2.043381929397583} +11/06/2021 22:56:06 - INFO - __main__ - Step 12199: {'lr': 0.0004941652836992198, 'samples': 2342208, 'steps': 12198, 'loss/train': 1.0915753841400146} +11/06/2021 22:56:06 - INFO - __main__ - Step 12200: {'lr': 0.0004941641438297955, 'samples': 2342400, 'steps': 12199, 'loss/train': 1.6756670475006104} +11/06/2021 22:56:07 - INFO - __main__ - Step 12201: {'lr': 0.0004941630038503545, 'samples': 2342592, 'steps': 12200, 'loss/train': 1.9415992498397827} +11/06/2021 22:56:08 - INFO - __main__ - Step 12202: {'lr': 0.0004941618637608976, 'samples': 2342784, 'steps': 12201, 'loss/train': 2.4285848140716553} +11/06/2021 22:56:08 - INFO - __main__ - Step 12203: {'lr': 0.000494160723561425, 'samples': 2342976, 'steps': 12202, 'loss/train': 0.7406458854675293} +11/06/2021 22:56:08 - INFO - __main__ - Step 12204: {'lr': 0.0004941595832519374, 'samples': 2343168, 'steps': 12203, 'loss/train': 1.799933910369873} +11/06/2021 22:56:09 - INFO - __main__ - Step 12205: {'lr': 0.0004941584428324352, 'samples': 2343360, 'steps': 12204, 'loss/train': 1.6155633926391602} +11/06/2021 22:56:10 - INFO - __main__ - Step 12206: {'lr': 0.000494157302302919, 'samples': 2343552, 'steps': 12205, 'loss/train': 1.4476592540740967} +11/06/2021 22:56:10 - INFO - __main__ - Step 12207: {'lr': 0.0004941561616633893, 'samples': 2343744, 'steps': 12206, 'loss/train': 1.3193042278289795} +11/06/2021 22:56:11 - INFO - __main__ - Step 12208: {'lr': 0.0004941550209138466, 'samples': 2343936, 'steps': 12207, 'loss/train': 0.9178276062011719} +11/06/2021 22:56:11 - INFO - __main__ - Step 12209: {'lr': 0.0004941538800542915, 'samples': 2344128, 'steps': 12208, 'loss/train': 2.1289122104644775} +11/06/2021 22:56:11 - INFO - __main__ - Step 12210: {'lr': 0.0004941527390847243, 'samples': 2344320, 'steps': 12209, 'loss/train': 1.1334985494613647} +11/06/2021 22:56:12 - INFO - __main__ - Step 12211: {'lr': 0.0004941515980051457, 'samples': 2344512, 'steps': 12210, 'loss/train': 1.8072400093078613} +11/06/2021 22:56:13 - INFO - __main__ - Step 12212: {'lr': 0.0004941504568155561, 'samples': 2344704, 'steps': 12211, 'loss/train': 2.0195960998535156} +11/06/2021 22:56:13 - INFO - __main__ - Step 12213: {'lr': 0.0004941493155159562, 'samples': 2344896, 'steps': 12212, 'loss/train': 1.8710730075836182} +11/06/2021 22:56:13 - INFO - __main__ - Step 12214: {'lr': 0.0004941481741063462, 'samples': 2345088, 'steps': 12213, 'loss/train': 6.926916599273682} +11/06/2021 22:56:14 - INFO - __main__ - Step 12215: {'lr': 0.000494147032586727, 'samples': 2345280, 'steps': 12214, 'loss/train': 1.6592782735824585} +11/06/2021 22:56:14 - INFO - __main__ - Step 12216: {'lr': 0.0004941458909570988, 'samples': 2345472, 'steps': 12215, 'loss/train': 2.1829493045806885} +11/06/2021 22:56:14 - INFO - __main__ - Step 12217: {'lr': 0.0004941447492174622, 'samples': 2345664, 'steps': 12216, 'loss/train': 1.9610031843185425} +11/06/2021 22:56:15 - INFO - __main__ - Step 12218: {'lr': 0.0004941436073678179, 'samples': 2345856, 'steps': 12217, 'loss/train': 1.678484320640564} +11/06/2021 22:56:16 - INFO - __main__ - Step 12219: {'lr': 0.0004941424654081661, 'samples': 2346048, 'steps': 12218, 'loss/train': 1.9036375284194946} +11/06/2021 22:56:16 - INFO - __main__ - Step 12220: {'lr': 0.0004941413233385075, 'samples': 2346240, 'steps': 12219, 'loss/train': 1.5224061012268066} +11/06/2021 22:56:16 - INFO - __main__ - Step 12221: {'lr': 0.0004941401811588426, 'samples': 2346432, 'steps': 12220, 'loss/train': 1.5389779806137085} +11/06/2021 22:56:17 - INFO - __main__ - Step 12222: {'lr': 0.0004941390388691719, 'samples': 2346624, 'steps': 12221, 'loss/train': 1.6822108030319214} +11/06/2021 22:56:18 - INFO - __main__ - Step 12223: {'lr': 0.0004941378964694959, 'samples': 2346816, 'steps': 12222, 'loss/train': 1.6283819675445557} +11/06/2021 22:56:18 - INFO - __main__ - Step 12224: {'lr': 0.0004941367539598152, 'samples': 2347008, 'steps': 12223, 'loss/train': 2.0302186012268066} +11/06/2021 22:56:19 - INFO - __main__ - Step 12225: {'lr': 0.0004941356113401301, 'samples': 2347200, 'steps': 12224, 'loss/train': 1.9460519552230835} +11/06/2021 22:56:19 - INFO - __main__ - Step 12226: {'lr': 0.0004941344686104414, 'samples': 2347392, 'steps': 12225, 'loss/train': 1.5134607553482056} +11/06/2021 22:56:19 - INFO - __main__ - Step 12227: {'lr': 0.0004941333257707495, 'samples': 2347584, 'steps': 12226, 'loss/train': 1.468488097190857} +11/06/2021 22:56:20 - INFO - __main__ - Step 12228: {'lr': 0.0004941321828210548, 'samples': 2347776, 'steps': 12227, 'loss/train': 1.6733677387237549} +11/06/2021 22:56:21 - INFO - __main__ - Step 12229: {'lr': 0.000494131039761358, 'samples': 2347968, 'steps': 12228, 'loss/train': 1.7591148614883423} +11/06/2021 22:56:21 - INFO - __main__ - Step 12230: {'lr': 0.0004941298965916594, 'samples': 2348160, 'steps': 12229, 'loss/train': 7.689951419830322} +11/06/2021 22:56:21 - INFO - __main__ - Step 12231: {'lr': 0.0004941287533119597, 'samples': 2348352, 'steps': 12230, 'loss/train': 1.1296072006225586} +11/06/2021 22:56:22 - INFO - __main__ - Step 12232: {'lr': 0.0004941276099222593, 'samples': 2348544, 'steps': 12231, 'loss/train': 1.8858994245529175} +11/06/2021 22:56:22 - INFO - __main__ - Step 12233: {'lr': 0.0004941264664225589, 'samples': 2348736, 'steps': 12232, 'loss/train': 1.4118883609771729} +11/06/2021 22:56:23 - INFO - __main__ - Step 12234: {'lr': 0.0004941253228128588, 'samples': 2348928, 'steps': 12233, 'loss/train': 2.075518846511841} +11/06/2021 22:56:24 - INFO - __main__ - Step 12235: {'lr': 0.0004941241790931595, 'samples': 2349120, 'steps': 12234, 'loss/train': 1.6000714302062988} +11/06/2021 22:56:24 - INFO - __main__ - Step 12236: {'lr': 0.0004941230352634617, 'samples': 2349312, 'steps': 12235, 'loss/train': 1.9275367259979248} +11/06/2021 22:56:24 - INFO - __main__ - Step 12237: {'lr': 0.0004941218913237658, 'samples': 2349504, 'steps': 12236, 'loss/train': 2.1970300674438477} +11/06/2021 22:56:25 - INFO - __main__ - Step 12238: {'lr': 0.0004941207472740724, 'samples': 2349696, 'steps': 12237, 'loss/train': 1.9084161520004272} +11/06/2021 22:56:26 - INFO - __main__ - Step 12239: {'lr': 0.000494119603114382, 'samples': 2349888, 'steps': 12238, 'loss/train': 2.308227062225342} +11/06/2021 22:56:26 - INFO - __main__ - Step 12240: {'lr': 0.000494118458844695, 'samples': 2350080, 'steps': 12239, 'loss/train': 2.078315019607544} +11/06/2021 22:56:26 - INFO - __main__ - Step 12241: {'lr': 0.0004941173144650119, 'samples': 2350272, 'steps': 12240, 'loss/train': 1.4600110054016113} +11/06/2021 22:56:27 - INFO - __main__ - Step 12242: {'lr': 0.0004941161699753335, 'samples': 2350464, 'steps': 12241, 'loss/train': 2.5496790409088135} +11/06/2021 22:56:27 - INFO - __main__ - Step 12243: {'lr': 0.00049411502537566, 'samples': 2350656, 'steps': 12242, 'loss/train': 1.7416751384735107} +11/06/2021 22:56:28 - INFO - __main__ - Step 12244: {'lr': 0.0004941138806659921, 'samples': 2350848, 'steps': 12243, 'loss/train': 1.8958357572555542} +11/06/2021 22:56:29 - INFO - __main__ - Step 12245: {'lr': 0.00049411273584633, 'samples': 2351040, 'steps': 12244, 'loss/train': 1.8675121068954468} +11/06/2021 22:56:29 - INFO - __main__ - Step 12246: {'lr': 0.0004941115909166748, 'samples': 2351232, 'steps': 12245, 'loss/train': 1.8117626905441284} +11/06/2021 22:56:29 - INFO - __main__ - Step 12247: {'lr': 0.0004941104458770266, 'samples': 2351424, 'steps': 12246, 'loss/train': 1.715092420578003} +11/06/2021 22:56:30 - INFO - __main__ - Step 12248: {'lr': 0.0004941093007273859, 'samples': 2351616, 'steps': 12247, 'loss/train': 2.001997470855713} +11/06/2021 22:56:30 - INFO - __main__ - Step 12249: {'lr': 0.0004941081554677534, 'samples': 2351808, 'steps': 12248, 'loss/train': 1.8709745407104492} +11/06/2021 22:56:31 - INFO - __main__ - Step 12250: {'lr': 0.0004941070100981295, 'samples': 2352000, 'steps': 12249, 'loss/train': 2.0071144104003906} +11/06/2021 22:56:32 - INFO - __main__ - Step 12251: {'lr': 0.0004941058646185148, 'samples': 2352192, 'steps': 12250, 'loss/train': 1.7076789140701294} +11/06/2021 22:56:32 - INFO - __main__ - Step 12252: {'lr': 0.0004941047190289096, 'samples': 2352384, 'steps': 12251, 'loss/train': 2.314211845397949} +11/06/2021 22:56:32 - INFO - __main__ - Step 12253: {'lr': 0.0004941035733293148, 'samples': 2352576, 'steps': 12252, 'loss/train': 2.0742650032043457} +11/06/2021 22:56:33 - INFO - __main__ - Step 12254: {'lr': 0.0004941024275197305, 'samples': 2352768, 'steps': 12253, 'loss/train': 1.7907441854476929} +11/06/2021 22:56:34 - INFO - __main__ - Step 12255: {'lr': 0.0004941012816001575, 'samples': 2352960, 'steps': 12254, 'loss/train': 1.6902923583984375} +11/06/2021 22:56:34 - INFO - __main__ - Step 12256: {'lr': 0.0004941001355705963, 'samples': 2353152, 'steps': 12255, 'loss/train': 1.4194196462631226} +11/06/2021 22:56:34 - INFO - __main__ - Step 12257: {'lr': 0.0004940989894310473, 'samples': 2353344, 'steps': 12256, 'loss/train': 2.029238224029541} +11/06/2021 22:56:35 - INFO - __main__ - Step 12258: {'lr': 0.000494097843181511, 'samples': 2353536, 'steps': 12257, 'loss/train': 1.5298515558242798} +11/06/2021 22:56:35 - INFO - __main__ - Step 12259: {'lr': 0.0004940966968219881, 'samples': 2353728, 'steps': 12258, 'loss/train': 1.807405948638916} +11/06/2021 22:56:35 - INFO - __main__ - Step 12260: {'lr': 0.0004940955503524789, 'samples': 2353920, 'steps': 12259, 'loss/train': 1.857525110244751} +11/06/2021 22:56:36 - INFO - __main__ - Step 12261: {'lr': 0.000494094403772984, 'samples': 2354112, 'steps': 12260, 'loss/train': 1.2936711311340332} +11/06/2021 22:56:37 - INFO - __main__ - Step 12262: {'lr': 0.0004940932570835039, 'samples': 2354304, 'steps': 12261, 'loss/train': 1.5933314561843872} +11/06/2021 22:56:37 - INFO - __main__ - Step 12263: {'lr': 0.0004940921102840393, 'samples': 2354496, 'steps': 12262, 'loss/train': 1.8495118618011475} +11/06/2021 22:56:37 - INFO - __main__ - Step 12264: {'lr': 0.0004940909633745905, 'samples': 2354688, 'steps': 12263, 'loss/train': 1.749647617340088} +11/06/2021 22:56:38 - INFO - __main__ - Step 12265: {'lr': 0.000494089816355158, 'samples': 2354880, 'steps': 12264, 'loss/train': 1.2525612115859985} +11/06/2021 22:56:39 - INFO - __main__ - Step 12266: {'lr': 0.0004940886692257424, 'samples': 2355072, 'steps': 12265, 'loss/train': 1.6700724363327026} +11/06/2021 22:56:40 - INFO - __main__ - Step 12267: {'lr': 0.0004940875219863443, 'samples': 2355264, 'steps': 12266, 'loss/train': 1.503882646560669} +11/06/2021 22:56:40 - INFO - __main__ - Step 12268: {'lr': 0.0004940863746369641, 'samples': 2355456, 'steps': 12267, 'loss/train': 1.7664172649383545} +11/06/2021 22:56:40 - INFO - __main__ - Step 12269: {'lr': 0.0004940852271776023, 'samples': 2355648, 'steps': 12268, 'loss/train': 1.7359364032745361} +11/06/2021 22:56:41 - INFO - __main__ - Step 12270: {'lr': 0.0004940840796082594, 'samples': 2355840, 'steps': 12269, 'loss/train': 1.848609447479248} +11/06/2021 22:56:41 - INFO - __main__ - Step 12271: {'lr': 0.0004940829319289361, 'samples': 2356032, 'steps': 12270, 'loss/train': 1.8408467769622803} +11/06/2021 22:56:42 - INFO - __main__ - Step 12272: {'lr': 0.0004940817841396327, 'samples': 2356224, 'steps': 12271, 'loss/train': 1.7952295541763306} +11/06/2021 22:56:42 - INFO - __main__ - Step 12273: {'lr': 0.0004940806362403499, 'samples': 2356416, 'steps': 12272, 'loss/train': 2.3083720207214355} +11/06/2021 22:56:43 - INFO - __main__ - Step 12274: {'lr': 0.0004940794882310882, 'samples': 2356608, 'steps': 12273, 'loss/train': 1.8015666007995605} +11/06/2021 22:56:43 - INFO - __main__ - Step 12275: {'lr': 0.000494078340111848, 'samples': 2356800, 'steps': 12274, 'loss/train': 1.8969393968582153} +11/06/2021 22:56:43 - INFO - __main__ - Step 12276: {'lr': 0.0004940771918826298, 'samples': 2356992, 'steps': 12275, 'loss/train': 1.4344086647033691} +11/06/2021 22:56:44 - INFO - __main__ - Step 12277: {'lr': 0.0004940760435434341, 'samples': 2357184, 'steps': 12276, 'loss/train': 1.9090864658355713} +11/06/2021 22:56:45 - INFO - __main__ - Step 12278: {'lr': 0.0004940748950942618, 'samples': 2357376, 'steps': 12277, 'loss/train': 1.6862670183181763} +11/06/2021 22:56:45 - INFO - __main__ - Step 12279: {'lr': 0.0004940737465351128, 'samples': 2357568, 'steps': 12278, 'loss/train': 1.9722408056259155} +11/06/2021 22:56:45 - INFO - __main__ - Step 12280: {'lr': 0.0004940725978659881, 'samples': 2357760, 'steps': 12279, 'loss/train': 1.9200348854064941} +11/06/2021 22:56:46 - INFO - __main__ - Step 12281: {'lr': 0.000494071449086888, 'samples': 2357952, 'steps': 12280, 'loss/train': 1.9199883937835693} +11/06/2021 22:56:47 - INFO - __main__ - Step 12282: {'lr': 0.0004940703001978131, 'samples': 2358144, 'steps': 12281, 'loss/train': 1.2483066320419312} +11/06/2021 22:56:47 - INFO - __main__ - Step 12283: {'lr': 0.0004940691511987639, 'samples': 2358336, 'steps': 12282, 'loss/train': 1.7513079643249512} +11/06/2021 22:56:47 - INFO - __main__ - Step 12284: {'lr': 0.0004940680020897409, 'samples': 2358528, 'steps': 12283, 'loss/train': 5.813735485076904} +11/06/2021 22:56:48 - INFO - __main__ - Step 12285: {'lr': 0.0004940668528707446, 'samples': 2358720, 'steps': 12284, 'loss/train': 1.4615005254745483} +11/06/2021 22:56:48 - INFO - __main__ - Step 12286: {'lr': 0.0004940657035417755, 'samples': 2358912, 'steps': 12285, 'loss/train': 2.1803793907165527} +11/06/2021 22:56:49 - INFO - __main__ - Step 12287: {'lr': 0.0004940645541028343, 'samples': 2359104, 'steps': 12286, 'loss/train': 3.126666307449341} +11/06/2021 22:56:50 - INFO - __main__ - Step 12288: {'lr': 0.0004940634045539213, 'samples': 2359296, 'steps': 12287, 'loss/train': 1.47324800491333} +11/06/2021 22:56:50 - INFO - __main__ - Step 12289: {'lr': 0.000494062254895037, 'samples': 2359488, 'steps': 12288, 'loss/train': 1.7035387754440308} +11/06/2021 22:56:50 - INFO - __main__ - Step 12290: {'lr': 0.0004940611051261822, 'samples': 2359680, 'steps': 12289, 'loss/train': 1.6604784727096558} +11/06/2021 22:56:51 - INFO - __main__ - Step 12291: {'lr': 0.000494059955247357, 'samples': 2359872, 'steps': 12290, 'loss/train': 1.833449125289917} +11/06/2021 22:56:51 - INFO - __main__ - Step 12292: {'lr': 0.0004940588052585624, 'samples': 2360064, 'steps': 12291, 'loss/train': 1.7617274522781372} +11/06/2021 22:56:52 - INFO - __main__ - Step 12293: {'lr': 0.0004940576551597985, 'samples': 2360256, 'steps': 12292, 'loss/train': 1.5269970893859863} +11/06/2021 22:56:52 - INFO - __main__ - Step 12294: {'lr': 0.000494056504951066, 'samples': 2360448, 'steps': 12293, 'loss/train': 0.993115246295929} +11/06/2021 22:56:53 - INFO - __main__ - Step 12295: {'lr': 0.0004940553546323655, 'samples': 2360640, 'steps': 12294, 'loss/train': 1.4290341138839722} +11/06/2021 22:56:53 - INFO - __main__ - Step 12296: {'lr': 0.0004940542042036974, 'samples': 2360832, 'steps': 12295, 'loss/train': 1.7313815355300903} +11/06/2021 22:56:53 - INFO - __main__ - Step 12297: {'lr': 0.0004940530536650621, 'samples': 2361024, 'steps': 12296, 'loss/train': 1.907927393913269} +11/06/2021 22:56:54 - INFO - __main__ - Step 12298: {'lr': 0.0004940519030164605, 'samples': 2361216, 'steps': 12297, 'loss/train': 1.4239506721496582} +11/06/2021 22:56:55 - INFO - __main__ - Step 12299: {'lr': 0.0004940507522578927, 'samples': 2361408, 'steps': 12298, 'loss/train': 2.017463207244873} +11/06/2021 22:56:55 - INFO - __main__ - Step 12300: {'lr': 0.0004940496013893594, 'samples': 2361600, 'steps': 12299, 'loss/train': 1.8298779726028442} +11/06/2021 22:56:55 - INFO - __main__ - Step 12301: {'lr': 0.0004940484504108612, 'samples': 2361792, 'steps': 12300, 'loss/train': 1.4371073246002197} +11/06/2021 22:56:56 - INFO - __main__ - Step 12302: {'lr': 0.0004940472993223985, 'samples': 2361984, 'steps': 12301, 'loss/train': 1.8154419660568237} +11/06/2021 22:56:56 - INFO - __main__ - Step 12303: {'lr': 0.0004940461481239719, 'samples': 2362176, 'steps': 12302, 'loss/train': 1.6027586460113525} +11/06/2021 22:56:57 - INFO - __main__ - Step 12304: {'lr': 0.0004940449968155818, 'samples': 2362368, 'steps': 12303, 'loss/train': 2.39496111869812} +11/06/2021 22:56:58 - INFO - __main__ - Step 12305: {'lr': 0.0004940438453972288, 'samples': 2362560, 'steps': 12304, 'loss/train': 1.6671775579452515} +11/06/2021 22:56:58 - INFO - __main__ - Step 12306: {'lr': 0.0004940426938689135, 'samples': 2362752, 'steps': 12305, 'loss/train': 1.91392183303833} +11/06/2021 22:56:58 - INFO - __main__ - Step 12307: {'lr': 0.0004940415422306361, 'samples': 2362944, 'steps': 12306, 'loss/train': 1.1845285892486572} +11/06/2021 22:56:59 - INFO - __main__ - Step 12308: {'lr': 0.0004940403904823976, 'samples': 2363136, 'steps': 12307, 'loss/train': 1.8613651990890503} +11/06/2021 22:57:00 - INFO - __main__ - Step 12309: {'lr': 0.0004940392386241981, 'samples': 2363328, 'steps': 12308, 'loss/train': 2.2593603134155273} +11/06/2021 22:57:00 - INFO - __main__ - Step 12310: {'lr': 0.0004940380866560384, 'samples': 2363520, 'steps': 12309, 'loss/train': 1.829590916633606} +11/06/2021 22:57:00 - INFO - __main__ - Step 12311: {'lr': 0.0004940369345779187, 'samples': 2363712, 'steps': 12310, 'loss/train': 1.535210371017456} +11/06/2021 22:57:01 - INFO - __main__ - Step 12312: {'lr': 0.00049403578238984, 'samples': 2363904, 'steps': 12311, 'loss/train': 1.498138189315796} +11/06/2021 22:57:01 - INFO - __main__ - Step 12313: {'lr': 0.0004940346300918024, 'samples': 2364096, 'steps': 12312, 'loss/train': 1.6373891830444336} +11/06/2021 22:57:02 - INFO - __main__ - Step 12314: {'lr': 0.0004940334776838065, 'samples': 2364288, 'steps': 12313, 'loss/train': 2.0152111053466797} +11/06/2021 22:57:02 - INFO - __main__ - Step 12315: {'lr': 0.000494032325165853, 'samples': 2364480, 'steps': 12314, 'loss/train': 1.4806876182556152} +11/06/2021 22:57:03 - INFO - __main__ - Step 12316: {'lr': 0.0004940311725379423, 'samples': 2364672, 'steps': 12315, 'loss/train': 1.7899569272994995} +11/06/2021 22:57:03 - INFO - __main__ - Step 12317: {'lr': 0.0004940300198000748, 'samples': 2364864, 'steps': 12316, 'loss/train': 1.8684685230255127} +11/06/2021 22:57:03 - INFO - __main__ - Step 12318: {'lr': 0.0004940288669522513, 'samples': 2365056, 'steps': 12317, 'loss/train': 1.5197453498840332} +11/06/2021 22:57:05 - INFO - __main__ - Step 12319: {'lr': 0.000494027713994472, 'samples': 2365248, 'steps': 12318, 'loss/train': 1.7379388809204102} +11/06/2021 22:57:05 - INFO - __main__ - Step 12320: {'lr': 0.0004940265609267377, 'samples': 2365440, 'steps': 12319, 'loss/train': 1.384351372718811} +11/06/2021 22:57:05 - INFO - __main__ - Step 12321: {'lr': 0.0004940254077490487, 'samples': 2365632, 'steps': 12320, 'loss/train': 2.0284841060638428} +11/06/2021 22:57:06 - INFO - __main__ - Step 12322: {'lr': 0.0004940242544614056, 'samples': 2365824, 'steps': 12321, 'loss/train': 1.541722297668457} +11/06/2021 22:57:06 - INFO - __main__ - Step 12323: {'lr': 0.0004940231010638091, 'samples': 2366016, 'steps': 12322, 'loss/train': 1.9831137657165527} +11/06/2021 22:57:07 - INFO - __main__ - Step 12324: {'lr': 0.0004940219475562593, 'samples': 2366208, 'steps': 12323, 'loss/train': 0.3079480528831482} +11/06/2021 22:57:08 - INFO - __main__ - Step 12325: {'lr': 0.0004940207939387573, 'samples': 2366400, 'steps': 12324, 'loss/train': 1.5259820222854614} +11/06/2021 22:57:08 - INFO - __main__ - Step 12326: {'lr': 0.0004940196402113031, 'samples': 2366592, 'steps': 12325, 'loss/train': 1.683254361152649} +11/06/2021 22:57:08 - INFO - __main__ - Step 12327: {'lr': 0.0004940184863738975, 'samples': 2366784, 'steps': 12326, 'loss/train': 1.8076988458633423} +11/06/2021 22:57:09 - INFO - __main__ - Step 12328: {'lr': 0.0004940173324265407, 'samples': 2366976, 'steps': 12327, 'loss/train': 1.4422165155410767} +11/06/2021 22:57:10 - INFO - __main__ - Step 12329: {'lr': 0.0004940161783692338, 'samples': 2367168, 'steps': 12328, 'loss/train': 1.9659552574157715} +11/06/2021 22:57:10 - INFO - __main__ - Step 12330: {'lr': 0.0004940150242019768, 'samples': 2367360, 'steps': 12329, 'loss/train': 1.24222731590271} +11/06/2021 22:57:11 - INFO - __main__ - Step 12331: {'lr': 0.0004940138699247704, 'samples': 2367552, 'steps': 12330, 'loss/train': 2.182091474533081} +11/06/2021 22:57:11 - INFO - __main__ - Step 12332: {'lr': 0.0004940127155376151, 'samples': 2367744, 'steps': 12331, 'loss/train': 1.8635755777359009} +11/06/2021 22:57:11 - INFO - __main__ - Step 12333: {'lr': 0.0004940115610405114, 'samples': 2367936, 'steps': 12332, 'loss/train': 1.9940561056137085} +11/06/2021 22:57:12 - INFO - __main__ - Step 12334: {'lr': 0.0004940104064334599, 'samples': 2368128, 'steps': 12333, 'loss/train': 1.4782226085662842} +11/06/2021 22:57:12 - INFO - __main__ - Step 12335: {'lr': 0.0004940092517164612, 'samples': 2368320, 'steps': 12334, 'loss/train': 1.205909252166748} +11/06/2021 22:57:13 - INFO - __main__ - Step 12336: {'lr': 0.0004940080968895155, 'samples': 2368512, 'steps': 12335, 'loss/train': 2.1496191024780273} +11/06/2021 22:57:13 - INFO - __main__ - Step 12337: {'lr': 0.0004940069419526236, 'samples': 2368704, 'steps': 12336, 'loss/train': 1.5507055521011353} +11/06/2021 22:57:14 - INFO - __main__ - Step 12338: {'lr': 0.0004940057869057859, 'samples': 2368896, 'steps': 12337, 'loss/train': 0.8827195763587952} +11/06/2021 22:57:14 - INFO - __main__ - Step 12339: {'lr': 0.000494004631749003, 'samples': 2369088, 'steps': 12338, 'loss/train': 1.7027802467346191} +11/06/2021 22:57:14 - INFO - __main__ - Step 12340: {'lr': 0.0004940034764822754, 'samples': 2369280, 'steps': 12339, 'loss/train': 1.6618696451187134} +11/06/2021 22:57:15 - INFO - __main__ - Step 12341: {'lr': 0.0004940023211056036, 'samples': 2369472, 'steps': 12340, 'loss/train': 1.9544622898101807} +11/06/2021 22:57:16 - INFO - __main__ - Step 12342: {'lr': 0.0004940011656189881, 'samples': 2369664, 'steps': 12341, 'loss/train': 1.8119089603424072} +11/06/2021 22:57:16 - INFO - __main__ - Step 12343: {'lr': 0.0004940000100224295, 'samples': 2369856, 'steps': 12342, 'loss/train': 1.2512726783752441} +11/06/2021 22:57:17 - INFO - __main__ - Step 12344: {'lr': 0.0004939988543159282, 'samples': 2370048, 'steps': 12343, 'loss/train': 1.5961833000183105} +11/06/2021 22:57:17 - INFO - __main__ - Step 12345: {'lr': 0.0004939976984994847, 'samples': 2370240, 'steps': 12344, 'loss/train': 1.501064419746399} +11/06/2021 22:57:18 - INFO - __main__ - Step 12346: {'lr': 0.0004939965425730996, 'samples': 2370432, 'steps': 12345, 'loss/train': 1.6873294115066528} +11/06/2021 22:57:18 - INFO - __main__ - Step 12347: {'lr': 0.0004939953865367735, 'samples': 2370624, 'steps': 12346, 'loss/train': 1.1613168716430664} +11/06/2021 22:57:19 - INFO - __main__ - Step 12348: {'lr': 0.0004939942303905069, 'samples': 2370816, 'steps': 12347, 'loss/train': 1.5683062076568604} +11/06/2021 22:57:19 - INFO - __main__ - Step 12349: {'lr': 0.0004939930741343002, 'samples': 2371008, 'steps': 12348, 'loss/train': 1.0350655317306519} +11/06/2021 22:57:19 - INFO - __main__ - Step 12350: {'lr': 0.000493991917768154, 'samples': 2371200, 'steps': 12349, 'loss/train': 1.5559569597244263} +11/06/2021 22:57:20 - INFO - __main__ - Step 12351: {'lr': 0.0004939907612920688, 'samples': 2371392, 'steps': 12350, 'loss/train': 1.799564003944397} +11/06/2021 22:57:21 - INFO - __main__ - Step 12352: {'lr': 0.0004939896047060451, 'samples': 2371584, 'steps': 12351, 'loss/train': 1.0660388469696045} +11/06/2021 22:57:21 - INFO - __main__ - Step 12353: {'lr': 0.0004939884480100836, 'samples': 2371776, 'steps': 12352, 'loss/train': 1.4161072969436646} +11/06/2021 22:57:21 - INFO - __main__ - Step 12354: {'lr': 0.0004939872912041844, 'samples': 2371968, 'steps': 12353, 'loss/train': 1.7622441053390503} +11/06/2021 22:57:22 - INFO - __main__ - Step 12355: {'lr': 0.0004939861342883485, 'samples': 2372160, 'steps': 12354, 'loss/train': 1.4472774267196655} +11/06/2021 22:57:22 - INFO - __main__ - Step 12356: {'lr': 0.0004939849772625761, 'samples': 2372352, 'steps': 12355, 'loss/train': 1.7829986810684204} +11/06/2021 22:57:23 - INFO - __main__ - Step 12357: {'lr': 0.0004939838201268679, 'samples': 2372544, 'steps': 12356, 'loss/train': 2.1662769317626953} +11/06/2021 22:57:24 - INFO - __main__ - Step 12358: {'lr': 0.0004939826628812244, 'samples': 2372736, 'steps': 12357, 'loss/train': 1.5202739238739014} +11/06/2021 22:57:24 - INFO - __main__ - Step 12359: {'lr': 0.000493981505525646, 'samples': 2372928, 'steps': 12358, 'loss/train': 1.9102394580841064} +11/06/2021 22:57:24 - INFO - __main__ - Step 12360: {'lr': 0.0004939803480601333, 'samples': 2373120, 'steps': 12359, 'loss/train': 1.4958027601242065} +11/06/2021 22:57:25 - INFO - __main__ - Step 12361: {'lr': 0.0004939791904846869, 'samples': 2373312, 'steps': 12360, 'loss/train': 1.0917266607284546} +11/06/2021 22:57:26 - INFO - __main__ - Step 12362: {'lr': 0.0004939780327993072, 'samples': 2373504, 'steps': 12361, 'loss/train': 1.7016918659210205} +11/06/2021 22:57:26 - INFO - __main__ - Step 12363: {'lr': 0.0004939768750039946, 'samples': 2373696, 'steps': 12362, 'loss/train': 1.3413039445877075} +11/06/2021 22:57:26 - INFO - __main__ - Step 12364: {'lr': 0.00049397571709875, 'samples': 2373888, 'steps': 12363, 'loss/train': 2.0355639457702637} +11/06/2021 22:57:27 - INFO - __main__ - Step 12365: {'lr': 0.0004939745590835736, 'samples': 2374080, 'steps': 12364, 'loss/train': 2.2837467193603516} +11/06/2021 22:57:27 - INFO - __main__ - Step 12366: {'lr': 0.0004939734009584661, 'samples': 2374272, 'steps': 12365, 'loss/train': 2.075040578842163} +11/06/2021 22:57:28 - INFO - __main__ - Step 12367: {'lr': 0.0004939722427234279, 'samples': 2374464, 'steps': 12366, 'loss/train': 1.9329279661178589} +11/06/2021 22:57:28 - INFO - __main__ - Step 12368: {'lr': 0.0004939710843784596, 'samples': 2374656, 'steps': 12367, 'loss/train': 1.624833106994629} +11/06/2021 22:57:29 - INFO - __main__ - Step 12369: {'lr': 0.0004939699259235617, 'samples': 2374848, 'steps': 12368, 'loss/train': 1.8931273221969604} +11/06/2021 22:57:29 - INFO - __main__ - Step 12370: {'lr': 0.0004939687673587346, 'samples': 2375040, 'steps': 12369, 'loss/train': 1.79799222946167} +11/06/2021 22:57:29 - INFO - __main__ - Step 12371: {'lr': 0.0004939676086839791, 'samples': 2375232, 'steps': 12370, 'loss/train': 1.7580457925796509} +11/06/2021 22:57:30 - INFO - __main__ - Step 12372: {'lr': 0.0004939664498992955, 'samples': 2375424, 'steps': 12371, 'loss/train': 1.5857473611831665} +11/06/2021 22:57:31 - INFO - __main__ - Step 12373: {'lr': 0.0004939652910046844, 'samples': 2375616, 'steps': 12372, 'loss/train': 1.6514397859573364} +11/06/2021 22:57:31 - INFO - __main__ - Step 12374: {'lr': 0.0004939641320001462, 'samples': 2375808, 'steps': 12373, 'loss/train': 1.8684816360473633} +11/06/2021 22:57:31 - INFO - __main__ - Step 12375: {'lr': 0.0004939629728856817, 'samples': 2376000, 'steps': 12374, 'loss/train': 1.2412973642349243} +11/06/2021 22:57:32 - INFO - __main__ - Step 12376: {'lr': 0.0004939618136612911, 'samples': 2376192, 'steps': 12375, 'loss/train': 1.7167083024978638} +11/06/2021 22:57:33 - INFO - __main__ - Step 12377: {'lr': 0.0004939606543269751, 'samples': 2376384, 'steps': 12376, 'loss/train': 1.4133563041687012} +11/06/2021 22:57:33 - INFO - __main__ - Step 12378: {'lr': 0.0004939594948827343, 'samples': 2376576, 'steps': 12377, 'loss/train': 1.8891206979751587} +11/06/2021 22:57:34 - INFO - __main__ - Step 12379: {'lr': 0.000493958335328569, 'samples': 2376768, 'steps': 12378, 'loss/train': 1.7850967645645142} +11/06/2021 22:57:34 - INFO - __main__ - Step 12380: {'lr': 0.0004939571756644799, 'samples': 2376960, 'steps': 12379, 'loss/train': 1.6386349201202393} +11/06/2021 22:57:34 - INFO - __main__ - Step 12381: {'lr': 0.0004939560158904675, 'samples': 2377152, 'steps': 12380, 'loss/train': 0.9704276323318481} +11/06/2021 22:57:36 - INFO - __main__ - Step 12382: {'lr': 0.0004939548560065322, 'samples': 2377344, 'steps': 12381, 'loss/train': 1.7817976474761963} +11/06/2021 22:57:36 - INFO - __main__ - Step 12383: {'lr': 0.0004939536960126746, 'samples': 2377536, 'steps': 12382, 'loss/train': 1.5621471405029297} +11/06/2021 22:57:37 - INFO - __main__ - Step 12384: {'lr': 0.0004939525359088953, 'samples': 2377728, 'steps': 12383, 'loss/train': 1.8215516805648804} +11/06/2021 22:57:37 - INFO - __main__ - Step 12385: {'lr': 0.0004939513756951946, 'samples': 2377920, 'steps': 12384, 'loss/train': 1.7546138763427734} +11/06/2021 22:57:37 - INFO - __main__ - Step 12386: {'lr': 0.0004939502153715733, 'samples': 2378112, 'steps': 12385, 'loss/train': 1.881219744682312} +11/06/2021 22:57:38 - INFO - __main__ - Step 12387: {'lr': 0.0004939490549380318, 'samples': 2378304, 'steps': 12386, 'loss/train': 2.4455485343933105} +11/06/2021 22:57:38 - INFO - __main__ - Step 12388: {'lr': 0.0004939478943945706, 'samples': 2378496, 'steps': 12387, 'loss/train': 1.8239833116531372} +11/06/2021 22:57:39 - INFO - __main__ - Step 12389: {'lr': 0.0004939467337411903, 'samples': 2378688, 'steps': 12388, 'loss/train': 1.7355788946151733} +11/06/2021 22:57:39 - INFO - __main__ - Step 12390: {'lr': 0.0004939455729778912, 'samples': 2378880, 'steps': 12389, 'loss/train': 1.7384986877441406} +11/06/2021 22:57:40 - INFO - __main__ - Step 12391: {'lr': 0.0004939444121046741, 'samples': 2379072, 'steps': 12390, 'loss/train': 1.171319603919983} +11/06/2021 22:57:40 - INFO - __main__ - Step 12392: {'lr': 0.0004939432511215395, 'samples': 2379264, 'steps': 12391, 'loss/train': 1.6471529006958008} +11/06/2021 22:57:40 - INFO - __main__ - Step 12393: {'lr': 0.0004939420900284876, 'samples': 2379456, 'steps': 12392, 'loss/train': 1.4227564334869385} +11/06/2021 22:57:41 - INFO - __main__ - Step 12394: {'lr': 0.0004939409288255194, 'samples': 2379648, 'steps': 12393, 'loss/train': 1.9644057750701904} +11/06/2021 22:57:42 - INFO - __main__ - Step 12395: {'lr': 0.000493939767512635, 'samples': 2379840, 'steps': 12394, 'loss/train': 1.767325758934021} +11/06/2021 22:57:42 - INFO - __main__ - Step 12396: {'lr': 0.0004939386060898353, 'samples': 2380032, 'steps': 12395, 'loss/train': 2.075618267059326} +11/06/2021 22:57:42 - INFO - __main__ - Step 12397: {'lr': 0.0004939374445571206, 'samples': 2380224, 'steps': 12396, 'loss/train': 1.4473564624786377} +11/06/2021 22:57:43 - INFO - __main__ - Step 12398: {'lr': 0.0004939362829144913, 'samples': 2380416, 'steps': 12397, 'loss/train': 1.165976643562317} +11/06/2021 22:57:44 - INFO - __main__ - Step 12399: {'lr': 0.0004939351211619481, 'samples': 2380608, 'steps': 12398, 'loss/train': 2.2611637115478516} +11/06/2021 22:57:44 - INFO - __main__ - Step 12400: {'lr': 0.0004939339592994916, 'samples': 2380800, 'steps': 12399, 'loss/train': 2.222313165664673} +11/06/2021 22:57:45 - INFO - __main__ - Step 12401: {'lr': 0.0004939327973271222, 'samples': 2380992, 'steps': 12400, 'loss/train': 1.8177175521850586} +11/06/2021 22:57:45 - INFO - __main__ - Step 12402: {'lr': 0.0004939316352448403, 'samples': 2381184, 'steps': 12401, 'loss/train': 1.0791970491409302} +11/06/2021 22:57:45 - INFO - __main__ - Step 12403: {'lr': 0.0004939304730526467, 'samples': 2381376, 'steps': 12402, 'loss/train': 1.8736491203308105} +11/06/2021 22:57:46 - INFO - __main__ - Step 12404: {'lr': 0.0004939293107505418, 'samples': 2381568, 'steps': 12403, 'loss/train': 2.0087807178497314} +11/06/2021 22:57:47 - INFO - __main__ - Step 12405: {'lr': 0.0004939281483385261, 'samples': 2381760, 'steps': 12404, 'loss/train': 1.4684945344924927} +11/06/2021 22:57:47 - INFO - __main__ - Step 12406: {'lr': 0.0004939269858166001, 'samples': 2381952, 'steps': 12405, 'loss/train': 1.8479887247085571} +11/06/2021 22:57:47 - INFO - __main__ - Step 12407: {'lr': 0.0004939258231847644, 'samples': 2382144, 'steps': 12406, 'loss/train': 1.5185550451278687} +11/06/2021 22:57:48 - INFO - __main__ - Step 12408: {'lr': 0.0004939246604430195, 'samples': 2382336, 'steps': 12407, 'loss/train': 1.8069547414779663} +11/06/2021 22:57:48 - INFO - __main__ - Step 12409: {'lr': 0.0004939234975913659, 'samples': 2382528, 'steps': 12408, 'loss/train': 1.5137650966644287} +11/06/2021 22:57:49 - INFO - __main__ - Step 12410: {'lr': 0.0004939223346298042, 'samples': 2382720, 'steps': 12409, 'loss/train': 0.2782944142818451} +11/06/2021 22:57:50 - INFO - __main__ - Step 12411: {'lr': 0.0004939211715583347, 'samples': 2382912, 'steps': 12410, 'loss/train': 1.9376318454742432} +11/06/2021 22:57:50 - INFO - __main__ - Step 12412: {'lr': 0.0004939200083769582, 'samples': 2383104, 'steps': 12411, 'loss/train': 1.265969157218933} +11/06/2021 22:57:50 - INFO - __main__ - Step 12413: {'lr': 0.000493918845085675, 'samples': 2383296, 'steps': 12412, 'loss/train': 1.7577980756759644} +11/06/2021 22:57:51 - INFO - __main__ - Step 12414: {'lr': 0.000493917681684486, 'samples': 2383488, 'steps': 12413, 'loss/train': 0.3489714562892914} +11/06/2021 22:57:52 - INFO - __main__ - Step 12415: {'lr': 0.0004939165181733911, 'samples': 2383680, 'steps': 12414, 'loss/train': 1.9580268859863281} +11/06/2021 22:57:52 - INFO - __main__ - Step 12416: {'lr': 0.0004939153545523914, 'samples': 2383872, 'steps': 12415, 'loss/train': 1.4286139011383057} +11/06/2021 22:57:52 - INFO - __main__ - Step 12417: {'lr': 0.0004939141908214871, 'samples': 2384064, 'steps': 12416, 'loss/train': 1.9150186777114868} +11/06/2021 22:57:53 - INFO - __main__ - Step 12418: {'lr': 0.000493913026980679, 'samples': 2384256, 'steps': 12417, 'loss/train': 1.4130078554153442} +11/06/2021 22:57:53 - INFO - __main__ - Step 12419: {'lr': 0.0004939118630299672, 'samples': 2384448, 'steps': 12418, 'loss/train': 1.799317479133606} +11/06/2021 22:57:54 - INFO - __main__ - Step 12420: {'lr': 0.0004939106989693527, 'samples': 2384640, 'steps': 12419, 'loss/train': 2.154881477355957} +11/06/2021 22:57:55 - INFO - __main__ - Step 12421: {'lr': 0.0004939095347988357, 'samples': 2384832, 'steps': 12420, 'loss/train': 1.9314367771148682} +11/06/2021 22:57:55 - INFO - __main__ - Step 12422: {'lr': 0.0004939083705184169, 'samples': 2385024, 'steps': 12421, 'loss/train': 1.7732396125793457} +11/06/2021 22:57:55 - INFO - __main__ - Step 12423: {'lr': 0.0004939072061280967, 'samples': 2385216, 'steps': 12422, 'loss/train': 1.4663667678833008} +11/06/2021 22:57:56 - INFO - __main__ - Step 12424: {'lr': 0.0004939060416278756, 'samples': 2385408, 'steps': 12423, 'loss/train': 1.8774303197860718} +11/06/2021 22:57:57 - INFO - __main__ - Step 12425: {'lr': 0.0004939048770177543, 'samples': 2385600, 'steps': 12424, 'loss/train': 1.5539430379867554} +11/06/2021 22:57:57 - INFO - __main__ - Step 12426: {'lr': 0.0004939037122977332, 'samples': 2385792, 'steps': 12425, 'loss/train': 1.527437448501587} +11/06/2021 22:57:57 - INFO - __main__ - Step 12427: {'lr': 0.0004939025474678129, 'samples': 2385984, 'steps': 12426, 'loss/train': 1.8269412517547607} +11/06/2021 22:57:58 - INFO - __main__ - Step 12428: {'lr': 0.0004939013825279939, 'samples': 2386176, 'steps': 12427, 'loss/train': 1.5649765729904175} +11/06/2021 22:57:58 - INFO - __main__ - Step 12429: {'lr': 0.0004939002174782766, 'samples': 2386368, 'steps': 12428, 'loss/train': 0.8925514221191406} +11/06/2021 22:57:59 - INFO - __main__ - Step 12430: {'lr': 0.0004938990523186616, 'samples': 2386560, 'steps': 12429, 'loss/train': 0.6605421304702759} +11/06/2021 22:57:59 - INFO - __main__ - Step 12431: {'lr': 0.0004938978870491495, 'samples': 2386752, 'steps': 12430, 'loss/train': 1.8025730848312378} +11/06/2021 22:58:00 - INFO - __main__ - Step 12432: {'lr': 0.0004938967216697409, 'samples': 2386944, 'steps': 12431, 'loss/train': 1.7200829982757568} +11/06/2021 22:58:00 - INFO - __main__ - Step 12433: {'lr': 0.0004938955561804361, 'samples': 2387136, 'steps': 12432, 'loss/train': 1.6927978992462158} +11/06/2021 22:58:00 - INFO - __main__ - Step 12434: {'lr': 0.0004938943905812357, 'samples': 2387328, 'steps': 12433, 'loss/train': 1.6915475130081177} +11/06/2021 22:58:02 - INFO - __main__ - Step 12435: {'lr': 0.0004938932248721401, 'samples': 2387520, 'steps': 12434, 'loss/train': 1.565805196762085} +11/06/2021 22:58:02 - INFO - __main__ - Step 12436: {'lr': 0.0004938920590531503, 'samples': 2387712, 'steps': 12435, 'loss/train': 1.8280435800552368} +11/06/2021 22:58:02 - INFO - __main__ - Step 12437: {'lr': 0.0004938908931242663, 'samples': 2387904, 'steps': 12436, 'loss/train': 1.499329924583435} +11/06/2021 22:58:03 - INFO - __main__ - Step 12438: {'lr': 0.0004938897270854889, 'samples': 2388096, 'steps': 12437, 'loss/train': 0.8522184491157532} +11/06/2021 22:58:03 - INFO - __main__ - Step 12439: {'lr': 0.0004938885609368184, 'samples': 2388288, 'steps': 12438, 'loss/train': 1.0399724245071411} +11/06/2021 22:58:03 - INFO - __main__ - Step 12440: {'lr': 0.0004938873946782557, 'samples': 2388480, 'steps': 12439, 'loss/train': 1.3930256366729736} +11/06/2021 22:58:04 - INFO - __main__ - Step 12441: {'lr': 0.000493886228309801, 'samples': 2388672, 'steps': 12440, 'loss/train': 2.077786922454834} +11/06/2021 22:58:05 - INFO - __main__ - Step 12442: {'lr': 0.0004938850618314549, 'samples': 2388864, 'steps': 12441, 'loss/train': 1.7731544971466064} +11/06/2021 22:58:05 - INFO - __main__ - Step 12443: {'lr': 0.000493883895243218, 'samples': 2389056, 'steps': 12442, 'loss/train': 1.930917501449585} +11/06/2021 22:58:05 - INFO - __main__ - Step 12444: {'lr': 0.0004938827285450908, 'samples': 2389248, 'steps': 12443, 'loss/train': 1.6230531930923462} +11/06/2021 22:58:06 - INFO - __main__ - Step 12445: {'lr': 0.0004938815617370737, 'samples': 2389440, 'steps': 12444, 'loss/train': 1.7806710004806519} +11/06/2021 22:58:07 - INFO - __main__ - Step 12446: {'lr': 0.0004938803948191674, 'samples': 2389632, 'steps': 12445, 'loss/train': 1.8226611614227295} +11/06/2021 22:58:07 - INFO - __main__ - Step 12447: {'lr': 0.0004938792277913724, 'samples': 2389824, 'steps': 12446, 'loss/train': 1.6907552480697632} +11/06/2021 22:58:07 - INFO - __main__ - Step 12448: {'lr': 0.0004938780606536891, 'samples': 2390016, 'steps': 12447, 'loss/train': 1.9399850368499756} +11/06/2021 22:58:08 - INFO - __main__ - Step 12449: {'lr': 0.0004938768934061182, 'samples': 2390208, 'steps': 12448, 'loss/train': 1.9037350416183472} +11/06/2021 22:58:08 - INFO - __main__ - Step 12450: {'lr': 0.0004938757260486601, 'samples': 2390400, 'steps': 12449, 'loss/train': 1.6695767641067505} +11/06/2021 22:58:09 - INFO - __main__ - Step 12451: {'lr': 0.0004938745585813153, 'samples': 2390592, 'steps': 12450, 'loss/train': 1.9863166809082031} +11/06/2021 22:58:09 - INFO - __main__ - Step 12452: {'lr': 0.0004938733910040845, 'samples': 2390784, 'steps': 12451, 'loss/train': 1.697218418121338} +11/06/2021 22:58:10 - INFO - __main__ - Step 12453: {'lr': 0.000493872223316968, 'samples': 2390976, 'steps': 12452, 'loss/train': 1.4199427366256714} +11/06/2021 22:58:10 - INFO - __main__ - Step 12454: {'lr': 0.0004938710555199664, 'samples': 2391168, 'steps': 12453, 'loss/train': 1.2885547876358032} +11/06/2021 22:58:10 - INFO - __main__ - Step 12455: {'lr': 0.0004938698876130804, 'samples': 2391360, 'steps': 12454, 'loss/train': 1.8421812057495117} +11/06/2021 22:58:12 - INFO - __main__ - Step 12456: {'lr': 0.0004938687195963104, 'samples': 2391552, 'steps': 12455, 'loss/train': 1.8967642784118652} +11/06/2021 22:58:12 - INFO - __main__ - Step 12457: {'lr': 0.0004938675514696569, 'samples': 2391744, 'steps': 12456, 'loss/train': 0.5866230726242065} +11/06/2021 22:58:12 - INFO - __main__ - Step 12458: {'lr': 0.0004938663832331204, 'samples': 2391936, 'steps': 12457, 'loss/train': 1.3953553438186646} +11/06/2021 22:58:13 - INFO - __main__ - Step 12459: {'lr': 0.0004938652148867014, 'samples': 2392128, 'steps': 12458, 'loss/train': 0.3347637355327606} +11/06/2021 22:58:13 - INFO - __main__ - Step 12460: {'lr': 0.0004938640464304006, 'samples': 2392320, 'steps': 12459, 'loss/train': 1.7510279417037964} +11/06/2021 22:58:14 - INFO - __main__ - Step 12461: {'lr': 0.0004938628778642185, 'samples': 2392512, 'steps': 12460, 'loss/train': 1.7119464874267578} +11/06/2021 22:58:15 - INFO - __main__ - Step 12462: {'lr': 0.0004938617091881554, 'samples': 2392704, 'steps': 12461, 'loss/train': 1.8808752298355103} +11/06/2021 22:58:15 - INFO - __main__ - Step 12463: {'lr': 0.000493860540402212, 'samples': 2392896, 'steps': 12462, 'loss/train': 1.534140706062317} +11/06/2021 22:58:15 - INFO - __main__ - Step 12464: {'lr': 0.0004938593715063888, 'samples': 2393088, 'steps': 12463, 'loss/train': 1.430334448814392} +11/06/2021 22:58:16 - INFO - __main__ - Step 12465: {'lr': 0.0004938582025006864, 'samples': 2393280, 'steps': 12464, 'loss/train': 1.060693621635437} +11/06/2021 22:58:16 - INFO - __main__ - Step 12466: {'lr': 0.0004938570333851052, 'samples': 2393472, 'steps': 12465, 'loss/train': 1.7933906316757202} +11/06/2021 22:58:17 - INFO - __main__ - Step 12467: {'lr': 0.0004938558641596458, 'samples': 2393664, 'steps': 12466, 'loss/train': 0.8866246938705444} +11/06/2021 22:58:18 - INFO - __main__ - Step 12468: {'lr': 0.0004938546948243087, 'samples': 2393856, 'steps': 12467, 'loss/train': 1.1550602912902832} +11/06/2021 22:58:18 - INFO - __main__ - Step 12469: {'lr': 0.0004938535253790944, 'samples': 2394048, 'steps': 12468, 'loss/train': 1.569968342781067} +11/06/2021 22:58:18 - INFO - __main__ - Step 12470: {'lr': 0.0004938523558240035, 'samples': 2394240, 'steps': 12469, 'loss/train': 1.5518238544464111} +11/06/2021 22:58:19 - INFO - __main__ - Step 12471: {'lr': 0.0004938511861590365, 'samples': 2394432, 'steps': 12470, 'loss/train': 1.680008053779602} +11/06/2021 22:58:20 - INFO - __main__ - Step 12472: {'lr': 0.000493850016384194, 'samples': 2394624, 'steps': 12471, 'loss/train': 1.5120447874069214} +11/06/2021 22:58:20 - INFO - __main__ - Step 12473: {'lr': 0.0004938488464994764, 'samples': 2394816, 'steps': 12472, 'loss/train': 1.2448487281799316} +11/06/2021 22:58:20 - INFO - __main__ - Step 12474: {'lr': 0.0004938476765048842, 'samples': 2395008, 'steps': 12473, 'loss/train': 1.75505530834198} +11/06/2021 22:58:21 - INFO - __main__ - Step 12475: {'lr': 0.0004938465064004181, 'samples': 2395200, 'steps': 12474, 'loss/train': 1.4993715286254883} +11/06/2021 22:58:21 - INFO - __main__ - Step 12476: {'lr': 0.0004938453361860785, 'samples': 2395392, 'steps': 12475, 'loss/train': 1.6002764701843262} +11/06/2021 22:58:22 - INFO - __main__ - Step 12477: {'lr': 0.0004938441658618659, 'samples': 2395584, 'steps': 12476, 'loss/train': 1.6196297407150269} +11/06/2021 22:58:22 - INFO - __main__ - Step 12478: {'lr': 0.0004938429954277809, 'samples': 2395776, 'steps': 12477, 'loss/train': 1.990778923034668} +11/06/2021 22:58:23 - INFO - __main__ - Step 12479: {'lr': 0.000493841824883824, 'samples': 2395968, 'steps': 12478, 'loss/train': 1.7635631561279297} +11/06/2021 22:58:23 - INFO - __main__ - Step 12480: {'lr': 0.0004938406542299956, 'samples': 2396160, 'steps': 12479, 'loss/train': 1.3563812971115112} +11/06/2021 22:58:23 - INFO - __main__ - Step 12481: {'lr': 0.0004938394834662966, 'samples': 2396352, 'steps': 12480, 'loss/train': 0.9850826859474182} +11/06/2021 22:58:24 - INFO - __main__ - Step 12482: {'lr': 0.0004938383125927272, 'samples': 2396544, 'steps': 12481, 'loss/train': 1.9261223077774048} +11/06/2021 22:58:25 - INFO - __main__ - Step 12483: {'lr': 0.0004938371416092881, 'samples': 2396736, 'steps': 12482, 'loss/train': 1.8350012302398682} +11/06/2021 22:58:25 - INFO - __main__ - Step 12484: {'lr': 0.0004938359705159796, 'samples': 2396928, 'steps': 12483, 'loss/train': 1.5597666501998901} +11/06/2021 22:58:25 - INFO - __main__ - Step 12485: {'lr': 0.0004938347993128025, 'samples': 2397120, 'steps': 12484, 'loss/train': 1.588280439376831} +11/06/2021 22:58:26 - INFO - __main__ - Step 12486: {'lr': 0.0004938336279997571, 'samples': 2397312, 'steps': 12485, 'loss/train': 1.8706063032150269} +11/06/2021 22:58:27 - INFO - __main__ - Step 12487: {'lr': 0.0004938324565768441, 'samples': 2397504, 'steps': 12486, 'loss/train': 1.8012641668319702} +11/06/2021 22:58:27 - INFO - __main__ - Step 12488: {'lr': 0.0004938312850440639, 'samples': 2397696, 'steps': 12487, 'loss/train': 0.9766202569007874} +11/06/2021 22:58:28 - INFO - __main__ - Step 12489: {'lr': 0.0004938301134014172, 'samples': 2397888, 'steps': 12488, 'loss/train': 1.6374305486679077} +11/06/2021 22:58:28 - INFO - __main__ - Step 12490: {'lr': 0.0004938289416489042, 'samples': 2398080, 'steps': 12489, 'loss/train': 2.0924293994903564} +11/06/2021 22:58:28 - INFO - __main__ - Step 12491: {'lr': 0.0004938277697865259, 'samples': 2398272, 'steps': 12490, 'loss/train': 1.4682444334030151} +11/06/2021 22:58:29 - INFO - __main__ - Step 12492: {'lr': 0.0004938265978142824, 'samples': 2398464, 'steps': 12491, 'loss/train': 2.014890193939209} +11/06/2021 22:58:30 - INFO - __main__ - Step 12493: {'lr': 0.0004938254257321745, 'samples': 2398656, 'steps': 12492, 'loss/train': 1.3816254138946533} +11/06/2021 22:58:30 - INFO - __main__ - Step 12494: {'lr': 0.0004938242535402025, 'samples': 2398848, 'steps': 12493, 'loss/train': 1.4478893280029297} +11/06/2021 22:58:30 - INFO - __main__ - Step 12495: {'lr': 0.0004938230812383672, 'samples': 2399040, 'steps': 12494, 'loss/train': 4.631295680999756} +11/06/2021 22:58:31 - INFO - __main__ - Step 12496: {'lr': 0.0004938219088266688, 'samples': 2399232, 'steps': 12495, 'loss/train': 1.651924729347229} +11/06/2021 22:58:31 - INFO - __main__ - Step 12497: {'lr': 0.0004938207363051082, 'samples': 2399424, 'steps': 12496, 'loss/train': 1.7738444805145264} +11/06/2021 22:58:32 - INFO - __main__ - Step 12498: {'lr': 0.0004938195636736857, 'samples': 2399616, 'steps': 12497, 'loss/train': 1.413539171218872} +11/06/2021 22:58:33 - INFO - __main__ - Step 12499: {'lr': 0.0004938183909324017, 'samples': 2399808, 'steps': 12498, 'loss/train': 1.9373109340667725} +11/06/2021 22:58:33 - INFO - __main__ - Step 12500: {'lr': 0.0004938172180812571, 'samples': 2400000, 'steps': 12499, 'loss/train': 2.0888149738311768} +11/06/2021 22:58:34 - INFO - __main__ - Step 12501: {'lr': 0.000493816045120252, 'samples': 2400192, 'steps': 12500, 'loss/train': 1.6998056173324585} +11/06/2021 22:58:34 - INFO - __main__ - Step 12502: {'lr': 0.0004938148720493873, 'samples': 2400384, 'steps': 12501, 'loss/train': 1.5378485918045044} +11/06/2021 22:58:35 - INFO - __main__ - Step 12503: {'lr': 0.0004938136988686634, 'samples': 2400576, 'steps': 12502, 'loss/train': 0.36686891317367554} +11/06/2021 22:58:35 - INFO - __main__ - Step 12504: {'lr': 0.0004938125255780808, 'samples': 2400768, 'steps': 12503, 'loss/train': 1.6974081993103027} +11/06/2021 22:58:36 - INFO - __main__ - Step 12505: {'lr': 0.0004938113521776401, 'samples': 2400960, 'steps': 12504, 'loss/train': 1.7452573776245117} +11/06/2021 22:58:36 - INFO - __main__ - Step 12506: {'lr': 0.0004938101786673416, 'samples': 2401152, 'steps': 12505, 'loss/train': 1.861094355583191} +11/06/2021 22:58:36 - INFO - __main__ - Step 12507: {'lr': 0.0004938090050471861, 'samples': 2401344, 'steps': 12506, 'loss/train': 1.3893704414367676} +11/06/2021 22:58:37 - INFO - __main__ - Step 12508: {'lr': 0.000493807831317174, 'samples': 2401536, 'steps': 12507, 'loss/train': 1.7757277488708496} +11/06/2021 22:58:38 - INFO - __main__ - Step 12509: {'lr': 0.0004938066574773058, 'samples': 2401728, 'steps': 12508, 'loss/train': 2.139897346496582} +11/06/2021 22:58:38 - INFO - __main__ - Step 12510: {'lr': 0.0004938054835275822, 'samples': 2401920, 'steps': 12509, 'loss/train': 1.3797563314437866} +11/06/2021 22:58:38 - INFO - __main__ - Step 12511: {'lr': 0.0004938043094680036, 'samples': 2402112, 'steps': 12510, 'loss/train': 1.6733269691467285} +11/06/2021 22:58:39 - INFO - __main__ - Step 12512: {'lr': 0.0004938031352985704, 'samples': 2402304, 'steps': 12511, 'loss/train': 1.8873792886734009} +11/06/2021 22:58:40 - INFO - __main__ - Step 12513: {'lr': 0.0004938019610192835, 'samples': 2402496, 'steps': 12512, 'loss/train': 2.266671657562256} +11/06/2021 22:58:40 - INFO - __main__ - Step 12514: {'lr': 0.0004938007866301429, 'samples': 2402688, 'steps': 12513, 'loss/train': 1.8477656841278076} +11/06/2021 22:58:40 - INFO - __main__ - Step 12515: {'lr': 0.0004937996121311496, 'samples': 2402880, 'steps': 12514, 'loss/train': 1.2845678329467773} +11/06/2021 22:58:41 - INFO - __main__ - Step 12516: {'lr': 0.000493798437522304, 'samples': 2403072, 'steps': 12515, 'loss/train': 1.3590694665908813} +11/06/2021 22:58:41 - INFO - __main__ - Step 12517: {'lr': 0.0004937972628036065, 'samples': 2403264, 'steps': 12516, 'loss/train': 1.4171817302703857} +11/06/2021 22:58:42 - INFO - __main__ - Step 12518: {'lr': 0.0004937960879750578, 'samples': 2403456, 'steps': 12517, 'loss/train': 1.5596864223480225} +11/06/2021 22:58:43 - INFO - __main__ - Step 12519: {'lr': 0.0004937949130366582, 'samples': 2403648, 'steps': 12518, 'loss/train': 1.6341605186462402} +11/06/2021 22:58:43 - INFO - __main__ - Step 12520: {'lr': 0.0004937937379884085, 'samples': 2403840, 'steps': 12519, 'loss/train': 1.1687759160995483} +11/06/2021 22:58:43 - INFO - __main__ - Step 12521: {'lr': 0.0004937925628303091, 'samples': 2404032, 'steps': 12520, 'loss/train': 1.7421510219573975} +11/06/2021 22:58:44 - INFO - __main__ - Step 12522: {'lr': 0.0004937913875623605, 'samples': 2404224, 'steps': 12521, 'loss/train': 1.12235426902771} +11/06/2021 22:58:44 - INFO - __main__ - Step 12523: {'lr': 0.0004937902121845633, 'samples': 2404416, 'steps': 12522, 'loss/train': 1.6094740629196167} +11/06/2021 22:58:45 - INFO - __main__ - Step 12524: {'lr': 0.000493789036696918, 'samples': 2404608, 'steps': 12523, 'loss/train': 1.749121069908142} +11/06/2021 22:58:45 - INFO - __main__ - Step 12525: {'lr': 0.000493787861099425, 'samples': 2404800, 'steps': 12524, 'loss/train': 1.0136215686798096} +11/06/2021 22:58:46 - INFO - __main__ - Step 12526: {'lr': 0.0004937866853920851, 'samples': 2404992, 'steps': 12525, 'loss/train': 1.7210983037948608} +11/06/2021 22:58:46 - INFO - __main__ - Step 12527: {'lr': 0.0004937855095748985, 'samples': 2405184, 'steps': 12526, 'loss/train': 1.8808726072311401} +11/06/2021 22:58:46 - INFO - __main__ - Step 12528: {'lr': 0.0004937843336478661, 'samples': 2405376, 'steps': 12527, 'loss/train': 1.6538246870040894} +11/06/2021 22:58:48 - INFO - __main__ - Step 12529: {'lr': 0.0004937831576109881, 'samples': 2405568, 'steps': 12528, 'loss/train': 1.4507884979248047} +11/06/2021 22:58:48 - INFO - __main__ - Step 12530: {'lr': 0.0004937819814642653, 'samples': 2405760, 'steps': 12529, 'loss/train': 1.7369753122329712} +11/06/2021 22:58:49 - INFO - __main__ - Step 12531: {'lr': 0.000493780805207698, 'samples': 2405952, 'steps': 12530, 'loss/train': 1.33586585521698} +11/06/2021 22:58:49 - INFO - __main__ - Step 12532: {'lr': 0.000493779628841287, 'samples': 2406144, 'steps': 12531, 'loss/train': 2.222987413406372} +11/06/2021 22:58:49 - INFO - __main__ - Step 12533: {'lr': 0.0004937784523650324, 'samples': 2406336, 'steps': 12532, 'loss/train': 0.8576833605766296} +11/06/2021 22:58:50 - INFO - __main__ - Step 12534: {'lr': 0.0004937772757789352, 'samples': 2406528, 'steps': 12533, 'loss/train': 0.9707418084144592} +11/06/2021 22:58:51 - INFO - __main__ - Step 12535: {'lr': 0.0004937760990829956, 'samples': 2406720, 'steps': 12534, 'loss/train': 1.9520204067230225} +11/06/2021 22:58:51 - INFO - __main__ - Step 12536: {'lr': 0.0004937749222772143, 'samples': 2406912, 'steps': 12535, 'loss/train': 1.7065337896347046} +11/06/2021 22:58:51 - INFO - __main__ - Step 12537: {'lr': 0.0004937737453615918, 'samples': 2407104, 'steps': 12536, 'loss/train': 1.8596389293670654} +11/06/2021 22:58:52 - INFO - __main__ - Step 12538: {'lr': 0.0004937725683361286, 'samples': 2407296, 'steps': 12537, 'loss/train': 1.6391980648040771} +11/06/2021 22:58:52 - INFO - __main__ - Step 12539: {'lr': 0.0004937713912008252, 'samples': 2407488, 'steps': 12538, 'loss/train': 0.9928711652755737} +11/06/2021 22:58:53 - INFO - __main__ - Step 12540: {'lr': 0.0004937702139556822, 'samples': 2407680, 'steps': 12539, 'loss/train': 2.0436432361602783} +11/06/2021 22:58:54 - INFO - __main__ - Step 12541: {'lr': 0.0004937690366007, 'samples': 2407872, 'steps': 12540, 'loss/train': 1.766875982284546} +11/06/2021 22:58:54 - INFO - __main__ - Step 12542: {'lr': 0.0004937678591358794, 'samples': 2408064, 'steps': 12541, 'loss/train': 1.9210069179534912} +11/06/2021 22:58:54 - INFO - __main__ - Step 12543: {'lr': 0.0004937666815612207, 'samples': 2408256, 'steps': 12542, 'loss/train': 1.523587703704834} +11/06/2021 22:58:55 - INFO - __main__ - Step 12544: {'lr': 0.0004937655038767245, 'samples': 2408448, 'steps': 12543, 'loss/train': 1.4020729064941406} +11/06/2021 22:58:56 - INFO - __main__ - Step 12545: {'lr': 0.0004937643260823914, 'samples': 2408640, 'steps': 12544, 'loss/train': 1.2543262243270874} +11/06/2021 22:58:56 - INFO - __main__ - Step 12546: {'lr': 0.0004937631481782218, 'samples': 2408832, 'steps': 12545, 'loss/train': 1.850257396697998} +11/06/2021 22:58:56 - INFO - __main__ - Step 12547: {'lr': 0.0004937619701642162, 'samples': 2409024, 'steps': 12546, 'loss/train': 2.321528434753418} +11/06/2021 22:58:57 - INFO - __main__ - Step 12548: {'lr': 0.0004937607920403752, 'samples': 2409216, 'steps': 12547, 'loss/train': 2.2833588123321533} +11/06/2021 22:58:57 - INFO - __main__ - Step 12549: {'lr': 0.0004937596138066996, 'samples': 2409408, 'steps': 12548, 'loss/train': 1.803352952003479} +11/06/2021 22:58:58 - INFO - __main__ - Step 12550: {'lr': 0.0004937584354631894, 'samples': 2409600, 'steps': 12549, 'loss/train': 2.182974100112915} +11/06/2021 22:58:58 - INFO - __main__ - Step 12551: {'lr': 0.0004937572570098455, 'samples': 2409792, 'steps': 12550, 'loss/train': 1.5153863430023193} +11/06/2021 22:58:59 - INFO - __main__ - Step 12552: {'lr': 0.0004937560784466685, 'samples': 2409984, 'steps': 12551, 'loss/train': 1.986527681350708} +11/06/2021 22:58:59 - INFO - __main__ - Step 12553: {'lr': 0.0004937548997736586, 'samples': 2410176, 'steps': 12552, 'loss/train': 1.3949472904205322} +11/06/2021 22:58:59 - INFO - __main__ - Step 12554: {'lr': 0.0004937537209908165, 'samples': 2410368, 'steps': 12553, 'loss/train': 1.5035032033920288} +11/06/2021 22:59:00 - INFO - __main__ - Step 12555: {'lr': 0.0004937525420981428, 'samples': 2410560, 'steps': 12554, 'loss/train': 2.261537790298462} +11/06/2021 22:59:01 - INFO - __main__ - Step 12556: {'lr': 0.0004937513630956379, 'samples': 2410752, 'steps': 12555, 'loss/train': 3.3203577995300293} +11/06/2021 22:59:01 - INFO - __main__ - Step 12557: {'lr': 0.0004937501839833024, 'samples': 2410944, 'steps': 12556, 'loss/train': 1.5435712337493896} +11/06/2021 22:59:01 - INFO - __main__ - Step 12558: {'lr': 0.0004937490047611369, 'samples': 2411136, 'steps': 12557, 'loss/train': 1.9833227396011353} +11/06/2021 22:59:02 - INFO - __main__ - Step 12559: {'lr': 0.0004937478254291418, 'samples': 2411328, 'steps': 12558, 'loss/train': 1.6904947757720947} +11/06/2021 22:59:02 - INFO - __main__ - Step 12560: {'lr': 0.0004937466459873178, 'samples': 2411520, 'steps': 12559, 'loss/train': 1.6554052829742432} +11/06/2021 22:59:03 - INFO - __main__ - Step 12561: {'lr': 0.0004937454664356652, 'samples': 2411712, 'steps': 12560, 'loss/train': 1.7198843955993652} +11/06/2021 22:59:04 - INFO - __main__ - Step 12562: {'lr': 0.0004937442867741848, 'samples': 2411904, 'steps': 12561, 'loss/train': 1.9236637353897095} +11/06/2021 22:59:04 - INFO - __main__ - Step 12563: {'lr': 0.0004937431070028768, 'samples': 2412096, 'steps': 12562, 'loss/train': 1.9572961330413818} +11/06/2021 22:59:04 - INFO - __main__ - Step 12564: {'lr': 0.0004937419271217419, 'samples': 2412288, 'steps': 12563, 'loss/train': 5.857589244842529} +11/06/2021 22:59:05 - INFO - __main__ - Step 12565: {'lr': 0.0004937407471307807, 'samples': 2412480, 'steps': 12564, 'loss/train': 1.5907723903656006} +11/06/2021 22:59:05 - INFO - __main__ - Step 12566: {'lr': 0.0004937395670299938, 'samples': 2412672, 'steps': 12565, 'loss/train': 1.3296524286270142} +11/06/2021 22:59:06 - INFO - __main__ - Step 12567: {'lr': 0.0004937383868193815, 'samples': 2412864, 'steps': 12566, 'loss/train': 1.7416648864746094} +11/06/2021 22:59:06 - INFO - __main__ - Step 12568: {'lr': 0.0004937372064989445, 'samples': 2413056, 'steps': 12567, 'loss/train': 1.3068746328353882} +11/06/2021 22:59:07 - INFO - __main__ - Step 12569: {'lr': 0.0004937360260686833, 'samples': 2413248, 'steps': 12568, 'loss/train': 1.8562533855438232} +11/06/2021 22:59:07 - INFO - __main__ - Step 12570: {'lr': 0.0004937348455285983, 'samples': 2413440, 'steps': 12569, 'loss/train': 1.5558427572250366} +11/06/2021 22:59:08 - INFO - __main__ - Step 12571: {'lr': 0.0004937336648786903, 'samples': 2413632, 'steps': 12570, 'loss/train': 1.8795865774154663} +11/06/2021 22:59:08 - INFO - __main__ - Step 12572: {'lr': 0.0004937324841189595, 'samples': 2413824, 'steps': 12571, 'loss/train': 1.9527837038040161} +11/06/2021 22:59:09 - INFO - __main__ - Step 12573: {'lr': 0.0004937313032494068, 'samples': 2414016, 'steps': 12572, 'loss/train': 1.613889217376709} +11/06/2021 22:59:09 - INFO - __main__ - Step 12574: {'lr': 0.0004937301222700324, 'samples': 2414208, 'steps': 12573, 'loss/train': 1.2357040643692017} +11/06/2021 22:59:10 - INFO - __main__ - Step 12575: {'lr': 0.0004937289411808369, 'samples': 2414400, 'steps': 12574, 'loss/train': 2.0651497840881348} +11/06/2021 22:59:10 - INFO - __main__ - Step 12576: {'lr': 0.000493727759981821, 'samples': 2414592, 'steps': 12575, 'loss/train': 1.5525745153427124} +11/06/2021 22:59:11 - INFO - __main__ - Step 12577: {'lr': 0.0004937265786729851, 'samples': 2414784, 'steps': 12576, 'loss/train': 0.8309584856033325} +11/06/2021 22:59:11 - INFO - __main__ - Step 12578: {'lr': 0.0004937253972543298, 'samples': 2414976, 'steps': 12577, 'loss/train': 2.5759201049804688} +11/06/2021 22:59:12 - INFO - __main__ - Step 12579: {'lr': 0.0004937242157258555, 'samples': 2415168, 'steps': 12578, 'loss/train': 2.0868546962738037} +11/06/2021 22:59:12 - INFO - __main__ - Step 12580: {'lr': 0.000493723034087563, 'samples': 2415360, 'steps': 12579, 'loss/train': 0.8102706074714661} +11/06/2021 22:59:12 - INFO - __main__ - Step 12581: {'lr': 0.0004937218523394525, 'samples': 2415552, 'steps': 12580, 'loss/train': 1.7701175212860107} +11/06/2021 22:59:13 - INFO - __main__ - Step 12582: {'lr': 0.0004937206704815248, 'samples': 2415744, 'steps': 12581, 'loss/train': 1.8174623250961304} +11/06/2021 22:59:14 - INFO - __main__ - Step 12583: {'lr': 0.0004937194885137803, 'samples': 2415936, 'steps': 12582, 'loss/train': 1.7041975259780884} +11/06/2021 22:59:14 - INFO - __main__ - Step 12584: {'lr': 0.0004937183064362196, 'samples': 2416128, 'steps': 12583, 'loss/train': 1.7389198541641235} +11/06/2021 22:59:14 - INFO - __main__ - Step 12585: {'lr': 0.0004937171242488431, 'samples': 2416320, 'steps': 12584, 'loss/train': 2.084197521209717} +11/06/2021 22:59:15 - INFO - __main__ - Step 12586: {'lr': 0.0004937159419516515, 'samples': 2416512, 'steps': 12585, 'loss/train': 1.9468644857406616} +11/06/2021 22:59:15 - INFO - __main__ - Step 12587: {'lr': 0.0004937147595446452, 'samples': 2416704, 'steps': 12586, 'loss/train': 1.4281747341156006} +11/06/2021 22:59:16 - INFO - __main__ - Step 12588: {'lr': 0.0004937135770278248, 'samples': 2416896, 'steps': 12587, 'loss/train': 1.688107967376709} +11/06/2021 22:59:17 - INFO - __main__ - Step 12589: {'lr': 0.0004937123944011908, 'samples': 2417088, 'steps': 12588, 'loss/train': 1.6565439701080322} +11/06/2021 22:59:17 - INFO - __main__ - Step 12590: {'lr': 0.0004937112116647439, 'samples': 2417280, 'steps': 12589, 'loss/train': 1.904050588607788} +11/06/2021 22:59:17 - INFO - __main__ - Step 12591: {'lr': 0.0004937100288184843, 'samples': 2417472, 'steps': 12590, 'loss/train': 1.9118624925613403} +11/06/2021 22:59:18 - INFO - __main__ - Step 12592: {'lr': 0.0004937088458624128, 'samples': 2417664, 'steps': 12591, 'loss/train': 1.8203307390213013} +11/06/2021 22:59:19 - INFO - __main__ - Step 12593: {'lr': 0.0004937076627965299, 'samples': 2417856, 'steps': 12592, 'loss/train': 2.2025625705718994} +11/06/2021 22:59:19 - INFO - __main__ - Step 12594: {'lr': 0.000493706479620836, 'samples': 2418048, 'steps': 12593, 'loss/train': 1.668437123298645} +11/06/2021 22:59:19 - INFO - __main__ - Step 12595: {'lr': 0.0004937052963353318, 'samples': 2418240, 'steps': 12594, 'loss/train': 0.7377382516860962} +11/06/2021 22:59:20 - INFO - __main__ - Step 12596: {'lr': 0.0004937041129400177, 'samples': 2418432, 'steps': 12595, 'loss/train': 2.0309805870056152} +11/06/2021 22:59:20 - INFO - __main__ - Step 12597: {'lr': 0.0004937029294348943, 'samples': 2418624, 'steps': 12596, 'loss/train': 2.111126661300659} +11/06/2021 22:59:21 - INFO - __main__ - Step 12598: {'lr': 0.0004937017458199621, 'samples': 2418816, 'steps': 12597, 'loss/train': 1.5420552492141724} +11/06/2021 22:59:21 - INFO - __main__ - Step 12599: {'lr': 0.0004937005620952217, 'samples': 2419008, 'steps': 12598, 'loss/train': 1.6897568702697754} +11/06/2021 22:59:22 - INFO - __main__ - Step 12600: {'lr': 0.0004936993782606735, 'samples': 2419200, 'steps': 12599, 'loss/train': 2.092362880706787} +11/06/2021 22:59:22 - INFO - __main__ - Step 12601: {'lr': 0.0004936981943163182, 'samples': 2419392, 'steps': 12600, 'loss/train': 1.7093287706375122} +11/06/2021 22:59:22 - INFO - __main__ - Step 12602: {'lr': 0.0004936970102621563, 'samples': 2419584, 'steps': 12601, 'loss/train': 1.4950854778289795} +11/06/2021 22:59:23 - INFO - __main__ - Step 12603: {'lr': 0.0004936958260981883, 'samples': 2419776, 'steps': 12602, 'loss/train': 1.867283582687378} +11/06/2021 22:59:24 - INFO - __main__ - Step 12604: {'lr': 0.0004936946418244146, 'samples': 2419968, 'steps': 12603, 'loss/train': 1.928859829902649} +11/06/2021 22:59:24 - INFO - __main__ - Step 12605: {'lr': 0.000493693457440836, 'samples': 2420160, 'steps': 12604, 'loss/train': 2.0806899070739746} +11/06/2021 22:59:25 - INFO - __main__ - Step 12606: {'lr': 0.0004936922729474526, 'samples': 2420352, 'steps': 12605, 'loss/train': 1.991079330444336} +11/06/2021 22:59:25 - INFO - __main__ - Step 12607: {'lr': 0.0004936910883442655, 'samples': 2420544, 'steps': 12606, 'loss/train': 1.499205231666565} +11/06/2021 22:59:25 - INFO - __main__ - Step 12608: {'lr': 0.0004936899036312749, 'samples': 2420736, 'steps': 12607, 'loss/train': 1.6349520683288574} +11/06/2021 22:59:26 - INFO - __main__ - Step 12609: {'lr': 0.0004936887188084813, 'samples': 2420928, 'steps': 12608, 'loss/train': 1.5434484481811523} +11/06/2021 22:59:27 - INFO - __main__ - Step 12610: {'lr': 0.0004936875338758855, 'samples': 2421120, 'steps': 12609, 'loss/train': 1.8176034688949585} +11/06/2021 22:59:27 - INFO - __main__ - Step 12611: {'lr': 0.0004936863488334877, 'samples': 2421312, 'steps': 12610, 'loss/train': 1.5530451536178589} +11/06/2021 22:59:27 - INFO - __main__ - Step 12612: {'lr': 0.0004936851636812886, 'samples': 2421504, 'steps': 12611, 'loss/train': 1.6083686351776123} +11/06/2021 22:59:28 - INFO - __main__ - Step 12613: {'lr': 0.0004936839784192888, 'samples': 2421696, 'steps': 12612, 'loss/train': 1.6676959991455078} +11/06/2021 22:59:29 - INFO - __main__ - Step 12614: {'lr': 0.0004936827930474887, 'samples': 2421888, 'steps': 12613, 'loss/train': 1.6996138095855713} +11/06/2021 22:59:29 - INFO - __main__ - Step 12615: {'lr': 0.0004936816075658889, 'samples': 2422080, 'steps': 12614, 'loss/train': 1.4866139888763428} +11/06/2021 22:59:30 - INFO - __main__ - Step 12616: {'lr': 0.00049368042197449, 'samples': 2422272, 'steps': 12615, 'loss/train': 1.4212651252746582} +11/06/2021 22:59:30 - INFO - __main__ - Step 12617: {'lr': 0.0004936792362732924, 'samples': 2422464, 'steps': 12616, 'loss/train': 1.7673671245574951} +11/06/2021 22:59:30 - INFO - __main__ - Step 12618: {'lr': 0.0004936780504622967, 'samples': 2422656, 'steps': 12617, 'loss/train': 0.7368472218513489} +11/06/2021 22:59:31 - INFO - __main__ - Step 12619: {'lr': 0.0004936768645415033, 'samples': 2422848, 'steps': 12618, 'loss/train': 1.724778652191162} +11/06/2021 22:59:32 - INFO - __main__ - Step 12620: {'lr': 0.0004936756785109131, 'samples': 2423040, 'steps': 12619, 'loss/train': 2.020928382873535} +11/06/2021 22:59:32 - INFO - __main__ - Step 12621: {'lr': 0.0004936744923705263, 'samples': 2423232, 'steps': 12620, 'loss/train': 1.8747974634170532} +11/06/2021 22:59:32 - INFO - __main__ - Step 12622: {'lr': 0.0004936733061203435, 'samples': 2423424, 'steps': 12621, 'loss/train': 1.8702856302261353} +11/06/2021 22:59:33 - INFO - __main__ - Step 12623: {'lr': 0.0004936721197603653, 'samples': 2423616, 'steps': 12622, 'loss/train': 2.058539628982544} +11/06/2021 22:59:34 - INFO - __main__ - Step 12624: {'lr': 0.0004936709332905923, 'samples': 2423808, 'steps': 12623, 'loss/train': 1.5451576709747314} +11/06/2021 22:59:34 - INFO - __main__ - Step 12625: {'lr': 0.0004936697467110248, 'samples': 2424000, 'steps': 12624, 'loss/train': 1.5256503820419312} +11/06/2021 22:59:34 - INFO - __main__ - Step 12626: {'lr': 0.0004936685600216635, 'samples': 2424192, 'steps': 12625, 'loss/train': 1.8777118921279907} +11/06/2021 22:59:35 - INFO - __main__ - Step 12627: {'lr': 0.0004936673732225088, 'samples': 2424384, 'steps': 12626, 'loss/train': 1.737566590309143} +11/06/2021 22:59:35 - INFO - __main__ - Step 12628: {'lr': 0.0004936661863135615, 'samples': 2424576, 'steps': 12627, 'loss/train': 1.7391878366470337} +11/06/2021 22:59:35 - INFO - __main__ - Step 12629: {'lr': 0.000493664999294822, 'samples': 2424768, 'steps': 12628, 'loss/train': 1.8638137578964233} +11/06/2021 22:59:37 - INFO - __main__ - Step 12630: {'lr': 0.0004936638121662908, 'samples': 2424960, 'steps': 12629, 'loss/train': 0.9604647159576416} +11/06/2021 22:59:37 - INFO - __main__ - Step 12631: {'lr': 0.0004936626249279683, 'samples': 2425152, 'steps': 12630, 'loss/train': 1.9379112720489502} +11/06/2021 22:59:37 - INFO - __main__ - Step 12632: {'lr': 0.0004936614375798553, 'samples': 2425344, 'steps': 12631, 'loss/train': 0.7208963632583618} +11/06/2021 22:59:38 - INFO - __main__ - Step 12633: {'lr': 0.0004936602501219522, 'samples': 2425536, 'steps': 12632, 'loss/train': 1.7763961553573608} +11/06/2021 22:59:38 - INFO - __main__ - Step 12634: {'lr': 0.0004936590625542595, 'samples': 2425728, 'steps': 12633, 'loss/train': 1.4927427768707275} +11/06/2021 22:59:39 - INFO - __main__ - Step 12635: {'lr': 0.0004936578748767779, 'samples': 2425920, 'steps': 12634, 'loss/train': 1.5714725255966187} +11/06/2021 22:59:40 - INFO - __main__ - Step 12636: {'lr': 0.0004936566870895078, 'samples': 2426112, 'steps': 12635, 'loss/train': 1.6926263570785522} +11/06/2021 22:59:40 - INFO - __main__ - Step 12637: {'lr': 0.0004936554991924496, 'samples': 2426304, 'steps': 12636, 'loss/train': 0.9753442406654358} +11/06/2021 22:59:40 - INFO - __main__ - Step 12638: {'lr': 0.0004936543111856041, 'samples': 2426496, 'steps': 12637, 'loss/train': 1.6684590578079224} +11/06/2021 22:59:41 - INFO - __main__ - Step 12639: {'lr': 0.0004936531230689717, 'samples': 2426688, 'steps': 12638, 'loss/train': 1.6691287755966187} +11/06/2021 22:59:42 - INFO - __main__ - Step 12640: {'lr': 0.000493651934842553, 'samples': 2426880, 'steps': 12639, 'loss/train': 1.628665566444397} +11/06/2021 22:59:42 - INFO - __main__ - Step 12641: {'lr': 0.0004936507465063486, 'samples': 2427072, 'steps': 12640, 'loss/train': 1.266121745109558} +11/06/2021 22:59:42 - INFO - __main__ - Step 12642: {'lr': 0.0004936495580603588, 'samples': 2427264, 'steps': 12641, 'loss/train': 1.7384616136550903} +11/06/2021 22:59:43 - INFO - __main__ - Step 12643: {'lr': 0.0004936483695045842, 'samples': 2427456, 'steps': 12642, 'loss/train': 1.6067787408828735} +11/06/2021 22:59:43 - INFO - __main__ - Step 12644: {'lr': 0.0004936471808390254, 'samples': 2427648, 'steps': 12643, 'loss/train': 1.7227269411087036} +11/06/2021 22:59:44 - INFO - __main__ - Step 12645: {'lr': 0.0004936459920636832, 'samples': 2427840, 'steps': 12644, 'loss/train': 1.4939666986465454} +11/06/2021 22:59:44 - INFO - __main__ - Step 12646: {'lr': 0.0004936448031785576, 'samples': 2428032, 'steps': 12645, 'loss/train': 1.5351349115371704} +11/06/2021 22:59:45 - INFO - __main__ - Step 12647: {'lr': 0.0004936436141836496, 'samples': 2428224, 'steps': 12646, 'loss/train': 1.6882507801055908} +11/06/2021 22:59:45 - INFO - __main__ - Step 12648: {'lr': 0.0004936424250789594, 'samples': 2428416, 'steps': 12647, 'loss/train': 2.1467108726501465} +11/06/2021 22:59:45 - INFO - __main__ - Step 12649: {'lr': 0.0004936412358644878, 'samples': 2428608, 'steps': 12648, 'loss/train': 1.2412645816802979} +11/06/2021 22:59:47 - INFO - __main__ - Step 12650: {'lr': 0.0004936400465402351, 'samples': 2428800, 'steps': 12649, 'loss/train': 1.8610800504684448} +11/06/2021 22:59:47 - INFO - __main__ - Step 12651: {'lr': 0.0004936388571062021, 'samples': 2428992, 'steps': 12650, 'loss/train': 0.7149181365966797} +11/06/2021 22:59:47 - INFO - __main__ - Step 12652: {'lr': 0.0004936376675623892, 'samples': 2429184, 'steps': 12651, 'loss/train': 1.40529203414917} +11/06/2021 22:59:48 - INFO - __main__ - Step 12653: {'lr': 0.0004936364779087967, 'samples': 2429376, 'steps': 12652, 'loss/train': 1.6117287874221802} +11/06/2021 22:59:48 - INFO - __main__ - Step 12654: {'lr': 0.0004936352881454256, 'samples': 2429568, 'steps': 12653, 'loss/train': 1.6259452104568481} +11/06/2021 22:59:49 - INFO - __main__ - Step 12655: {'lr': 0.000493634098272276, 'samples': 2429760, 'steps': 12654, 'loss/train': 0.9939618706703186} +11/06/2021 22:59:49 - INFO - __main__ - Step 12656: {'lr': 0.0004936329082893488, 'samples': 2429952, 'steps': 12655, 'loss/train': 1.6605446338653564} +11/06/2021 22:59:50 - INFO - __main__ - Step 12657: {'lr': 0.0004936317181966443, 'samples': 2430144, 'steps': 12656, 'loss/train': 1.8564437627792358} +11/06/2021 22:59:50 - INFO - __main__ - Step 12658: {'lr': 0.000493630527994163, 'samples': 2430336, 'steps': 12657, 'loss/train': 1.9009116888046265} +11/06/2021 22:59:50 - INFO - __main__ - Step 12659: {'lr': 0.0004936293376819058, 'samples': 2430528, 'steps': 12658, 'loss/train': 1.7733248472213745} +11/06/2021 22:59:52 - INFO - __main__ - Step 12660: {'lr': 0.0004936281472598728, 'samples': 2430720, 'steps': 12659, 'loss/train': 1.9527031183242798} +11/06/2021 22:59:52 - INFO - __main__ - Step 12661: {'lr': 0.0004936269567280648, 'samples': 2430912, 'steps': 12660, 'loss/train': 1.9170464277267456} +11/06/2021 22:59:52 - INFO - __main__ - Step 12662: {'lr': 0.0004936257660864822, 'samples': 2431104, 'steps': 12661, 'loss/train': 1.2196903228759766} +11/06/2021 22:59:53 - INFO - __main__ - Step 12663: {'lr': 0.0004936245753351256, 'samples': 2431296, 'steps': 12662, 'loss/train': 1.9647890329360962} +11/06/2021 22:59:53 - INFO - __main__ - Step 12664: {'lr': 0.0004936233844739955, 'samples': 2431488, 'steps': 12663, 'loss/train': 1.9114571809768677} +11/06/2021 22:59:54 - INFO - __main__ - Step 12665: {'lr': 0.0004936221935030924, 'samples': 2431680, 'steps': 12664, 'loss/train': 1.2946553230285645} +11/06/2021 22:59:54 - INFO - __main__ - Step 12666: {'lr': 0.000493621002422417, 'samples': 2431872, 'steps': 12665, 'loss/train': 1.6806825399398804} +11/06/2021 22:59:55 - INFO - __main__ - Step 12667: {'lr': 0.0004936198112319698, 'samples': 2432064, 'steps': 12666, 'loss/train': 1.6497493982315063} +11/06/2021 22:59:55 - INFO - __main__ - Step 12668: {'lr': 0.0004936186199317511, 'samples': 2432256, 'steps': 12667, 'loss/train': 0.71175217628479} +11/06/2021 22:59:55 - INFO - __main__ - Step 12669: {'lr': 0.0004936174285217618, 'samples': 2432448, 'steps': 12668, 'loss/train': 2.324061393737793} +11/06/2021 22:59:56 - INFO - __main__ - Step 12670: {'lr': 0.0004936162370020021, 'samples': 2432640, 'steps': 12669, 'loss/train': 1.2230273485183716} +11/06/2021 22:59:57 - INFO - __main__ - Step 12671: {'lr': 0.0004936150453724727, 'samples': 2432832, 'steps': 12670, 'loss/train': 1.6716129779815674} +11/06/2021 22:59:57 - INFO - __main__ - Step 12672: {'lr': 0.0004936138536331742, 'samples': 2433024, 'steps': 12671, 'loss/train': 1.5442752838134766} +11/06/2021 22:59:58 - INFO - __main__ - Step 12673: {'lr': 0.000493612661784107, 'samples': 2433216, 'steps': 12672, 'loss/train': 1.818224310874939} +11/06/2021 22:59:58 - INFO - __main__ - Step 12674: {'lr': 0.0004936114698252717, 'samples': 2433408, 'steps': 12673, 'loss/train': 1.5145035982131958} +11/06/2021 22:59:58 - INFO - __main__ - Step 12675: {'lr': 0.0004936102777566688, 'samples': 2433600, 'steps': 12674, 'loss/train': 0.6831874847412109} +11/06/2021 22:59:59 - INFO - __main__ - Step 12676: {'lr': 0.0004936090855782989, 'samples': 2433792, 'steps': 12675, 'loss/train': 1.201375961303711} +11/06/2021 23:00:00 - INFO - __main__ - Step 12677: {'lr': 0.0004936078932901625, 'samples': 2433984, 'steps': 12676, 'loss/train': 1.8787459135055542} +11/06/2021 23:00:00 - INFO - __main__ - Step 12678: {'lr': 0.0004936067008922602, 'samples': 2434176, 'steps': 12677, 'loss/train': 2.3367536067962646} +11/06/2021 23:00:00 - INFO - __main__ - Step 12679: {'lr': 0.0004936055083845924, 'samples': 2434368, 'steps': 12678, 'loss/train': 1.7321808338165283} +11/06/2021 23:00:01 - INFO - __main__ - Step 12680: {'lr': 0.0004936043157671597, 'samples': 2434560, 'steps': 12679, 'loss/train': 1.1493476629257202} +11/06/2021 23:00:02 - INFO - __main__ - Step 12681: {'lr': 0.0004936031230399628, 'samples': 2434752, 'steps': 12680, 'loss/train': 1.7847900390625} +11/06/2021 23:00:02 - INFO - __main__ - Step 12682: {'lr': 0.000493601930203002, 'samples': 2434944, 'steps': 12681, 'loss/train': 1.8895950317382812} +11/06/2021 23:00:03 - INFO - __main__ - Step 12683: {'lr': 0.0004936007372562778, 'samples': 2435136, 'steps': 12682, 'loss/train': 1.703395128250122} +11/06/2021 23:00:03 - INFO - __main__ - Step 12684: {'lr': 0.0004935995441997911, 'samples': 2435328, 'steps': 12683, 'loss/train': 1.5084177255630493} +11/06/2021 23:00:03 - INFO - __main__ - Step 12685: {'lr': 0.000493598351033542, 'samples': 2435520, 'steps': 12684, 'loss/train': 1.2693252563476562} +11/06/2021 23:00:04 - INFO - __main__ - Step 12686: {'lr': 0.0004935971577575313, 'samples': 2435712, 'steps': 12685, 'loss/train': 1.772753357887268} +11/06/2021 23:00:05 - INFO - __main__ - Step 12687: {'lr': 0.0004935959643717595, 'samples': 2435904, 'steps': 12686, 'loss/train': 1.3232539892196655} +11/06/2021 23:00:05 - INFO - __main__ - Step 12688: {'lr': 0.0004935947708762272, 'samples': 2436096, 'steps': 12687, 'loss/train': 1.1217036247253418} +11/06/2021 23:00:05 - INFO - __main__ - Step 12689: {'lr': 0.0004935935772709348, 'samples': 2436288, 'steps': 12688, 'loss/train': 2.837244987487793} +11/06/2021 23:00:06 - INFO - __main__ - Step 12690: {'lr': 0.0004935923835558829, 'samples': 2436480, 'steps': 12689, 'loss/train': 1.7220159769058228} +11/06/2021 23:00:07 - INFO - __main__ - Step 12691: {'lr': 0.0004935911897310719, 'samples': 2436672, 'steps': 12690, 'loss/train': 1.8013556003570557} +11/06/2021 23:00:07 - INFO - __main__ - Step 12692: {'lr': 0.0004935899957965027, 'samples': 2436864, 'steps': 12691, 'loss/train': 1.6648582220077515} +11/06/2021 23:00:07 - INFO - __main__ - Step 12693: {'lr': 0.0004935888017521754, 'samples': 2437056, 'steps': 12692, 'loss/train': 2.0813040733337402} +11/06/2021 23:00:08 - INFO - __main__ - Step 12694: {'lr': 0.0004935876075980908, 'samples': 2437248, 'steps': 12693, 'loss/train': 1.7684749364852905} +11/06/2021 23:00:08 - INFO - __main__ - Step 12695: {'lr': 0.0004935864133342495, 'samples': 2437440, 'steps': 12694, 'loss/train': 1.6431411504745483} +11/06/2021 23:00:09 - INFO - __main__ - Step 12696: {'lr': 0.0004935852189606517, 'samples': 2437632, 'steps': 12695, 'loss/train': 1.6132627725601196} +11/06/2021 23:00:09 - INFO - __main__ - Step 12697: {'lr': 0.0004935840244772984, 'samples': 2437824, 'steps': 12696, 'loss/train': 1.5991240739822388} +11/06/2021 23:00:10 - INFO - __main__ - Step 12698: {'lr': 0.0004935828298841898, 'samples': 2438016, 'steps': 12697, 'loss/train': 1.5647183656692505} +11/06/2021 23:00:10 - INFO - __main__ - Step 12699: {'lr': 0.0004935816351813265, 'samples': 2438208, 'steps': 12698, 'loss/train': 1.92881441116333} +11/06/2021 23:00:11 - INFO - __main__ - Step 12700: {'lr': 0.0004935804403687091, 'samples': 2438400, 'steps': 12699, 'loss/train': 1.8408360481262207} +11/06/2021 23:00:11 - INFO - __main__ - Step 12701: {'lr': 0.0004935792454463381, 'samples': 2438592, 'steps': 12700, 'loss/train': 1.49015212059021} +11/06/2021 23:00:12 - INFO - __main__ - Step 12702: {'lr': 0.000493578050414214, 'samples': 2438784, 'steps': 12701, 'loss/train': 1.8693770170211792} +11/06/2021 23:00:12 - INFO - __main__ - Step 12703: {'lr': 0.0004935768552723375, 'samples': 2438976, 'steps': 12702, 'loss/train': 1.6412677764892578} +11/06/2021 23:00:13 - INFO - __main__ - Step 12704: {'lr': 0.000493575660020709, 'samples': 2439168, 'steps': 12703, 'loss/train': 1.6965235471725464} +11/06/2021 23:00:13 - INFO - __main__ - Step 12705: {'lr': 0.000493574464659329, 'samples': 2439360, 'steps': 12704, 'loss/train': 1.4000598192214966} +11/06/2021 23:00:13 - INFO - __main__ - Step 12706: {'lr': 0.0004935732691881981, 'samples': 2439552, 'steps': 12705, 'loss/train': 1.8921767473220825} +11/06/2021 23:00:14 - INFO - __main__ - Step 12707: {'lr': 0.0004935720736073169, 'samples': 2439744, 'steps': 12706, 'loss/train': 1.973684310913086} +11/06/2021 23:00:15 - INFO - __main__ - Step 12708: {'lr': 0.0004935708779166859, 'samples': 2439936, 'steps': 12707, 'loss/train': 1.2805671691894531} +11/06/2021 23:00:15 - INFO - __main__ - Step 12709: {'lr': 0.0004935696821163056, 'samples': 2440128, 'steps': 12708, 'loss/train': 1.9279905557632446} +11/06/2021 23:00:15 - INFO - __main__ - Step 12710: {'lr': 0.0004935684862061766, 'samples': 2440320, 'steps': 12709, 'loss/train': 1.654013991355896} +11/06/2021 23:00:16 - INFO - __main__ - Step 12711: {'lr': 0.0004935672901862993, 'samples': 2440512, 'steps': 12710, 'loss/train': 1.4374395608901978} +11/06/2021 23:00:17 - INFO - __main__ - Step 12712: {'lr': 0.0004935660940566744, 'samples': 2440704, 'steps': 12711, 'loss/train': 1.640486240386963} +11/06/2021 23:00:17 - INFO - __main__ - Step 12713: {'lr': 0.0004935648978173024, 'samples': 2440896, 'steps': 12712, 'loss/train': 1.7238794565200806} +11/06/2021 23:00:17 - INFO - __main__ - Step 12714: {'lr': 0.0004935637014681837, 'samples': 2441088, 'steps': 12713, 'loss/train': 1.8015981912612915} +11/06/2021 23:00:18 - INFO - __main__ - Step 12715: {'lr': 0.0004935625050093191, 'samples': 2441280, 'steps': 12714, 'loss/train': 1.7736315727233887} +11/06/2021 23:00:18 - INFO - __main__ - Step 12716: {'lr': 0.000493561308440709, 'samples': 2441472, 'steps': 12715, 'loss/train': 1.336901068687439} +11/06/2021 23:00:19 - INFO - __main__ - Step 12717: {'lr': 0.0004935601117623538, 'samples': 2441664, 'steps': 12716, 'loss/train': 1.488775610923767} +11/06/2021 23:00:19 - INFO - __main__ - Step 12718: {'lr': 0.0004935589149742542, 'samples': 2441856, 'steps': 12717, 'loss/train': 2.1799232959747314} +11/06/2021 23:00:20 - INFO - __main__ - Step 12719: {'lr': 0.0004935577180764108, 'samples': 2442048, 'steps': 12718, 'loss/train': 1.3624755144119263} +11/06/2021 23:00:20 - INFO - __main__ - Step 12720: {'lr': 0.000493556521068824, 'samples': 2442240, 'steps': 12719, 'loss/train': 1.883273720741272} +11/06/2021 23:00:21 - INFO - __main__ - Step 12721: {'lr': 0.0004935553239514943, 'samples': 2442432, 'steps': 12720, 'loss/train': 1.8159416913986206} +11/06/2021 23:00:22 - INFO - __main__ - Step 12722: {'lr': 0.0004935541267244225, 'samples': 2442624, 'steps': 12721, 'loss/train': 1.7805633544921875} +11/06/2021 23:00:22 - INFO - __main__ - Step 12723: {'lr': 0.0004935529293876088, 'samples': 2442816, 'steps': 12722, 'loss/train': 1.8284835815429688} +11/06/2021 23:00:22 - INFO - __main__ - Step 12724: {'lr': 0.000493551731941054, 'samples': 2443008, 'steps': 12723, 'loss/train': 1.8245835304260254} +11/06/2021 23:00:23 - INFO - __main__ - Step 12725: {'lr': 0.0004935505343847586, 'samples': 2443200, 'steps': 12724, 'loss/train': 1.665300965309143} +11/06/2021 23:00:23 - INFO - __main__ - Step 12726: {'lr': 0.000493549336718723, 'samples': 2443392, 'steps': 12725, 'loss/train': 1.5313256978988647} +11/06/2021 23:00:23 - INFO - __main__ - Step 12727: {'lr': 0.0004935481389429479, 'samples': 2443584, 'steps': 12726, 'loss/train': 1.2466456890106201} +11/06/2021 23:00:24 - INFO - __main__ - Step 12728: {'lr': 0.0004935469410574337, 'samples': 2443776, 'steps': 12727, 'loss/train': 1.5720294713974} +11/06/2021 23:00:25 - INFO - __main__ - Step 12729: {'lr': 0.000493545743062181, 'samples': 2443968, 'steps': 12728, 'loss/train': 1.831040382385254} +11/06/2021 23:00:25 - INFO - __main__ - Step 12730: {'lr': 0.0004935445449571903, 'samples': 2444160, 'steps': 12729, 'loss/train': 1.5608617067337036} +11/06/2021 23:00:26 - INFO - __main__ - Step 12731: {'lr': 0.0004935433467424624, 'samples': 2444352, 'steps': 12730, 'loss/train': 1.843248963356018} +11/06/2021 23:00:26 - INFO - __main__ - Step 12732: {'lr': 0.0004935421484179974, 'samples': 2444544, 'steps': 12731, 'loss/train': 1.858343243598938} +11/06/2021 23:00:27 - INFO - __main__ - Step 12733: {'lr': 0.0004935409499837962, 'samples': 2444736, 'steps': 12732, 'loss/train': 2.449708938598633} +11/06/2021 23:00:27 - INFO - __main__ - Step 12734: {'lr': 0.0004935397514398591, 'samples': 2444928, 'steps': 12733, 'loss/train': 1.2555254697799683} +11/06/2021 23:00:27 - INFO - __main__ - Step 12735: {'lr': 0.0004935385527861869, 'samples': 2445120, 'steps': 12734, 'loss/train': 1.8298964500427246} +11/06/2021 23:00:28 - INFO - __main__ - Step 12736: {'lr': 0.0004935373540227798, 'samples': 2445312, 'steps': 12735, 'loss/train': 1.8937606811523438} +11/06/2021 23:00:28 - INFO - __main__ - Step 12737: {'lr': 0.0004935361551496387, 'samples': 2445504, 'steps': 12736, 'loss/train': 1.5406252145767212} +11/06/2021 23:00:29 - INFO - __main__ - Step 12738: {'lr': 0.0004935349561667638, 'samples': 2445696, 'steps': 12737, 'loss/train': 1.3331429958343506} +11/06/2021 23:00:30 - INFO - __main__ - Step 12739: {'lr': 0.000493533757074156, 'samples': 2445888, 'steps': 12738, 'loss/train': 1.462608814239502} +11/06/2021 23:00:30 - INFO - __main__ - Step 12740: {'lr': 0.0004935325578718155, 'samples': 2446080, 'steps': 12739, 'loss/train': 1.7719459533691406} +11/06/2021 23:00:30 - INFO - __main__ - Step 12741: {'lr': 0.000493531358559743, 'samples': 2446272, 'steps': 12740, 'loss/train': 1.849948525428772} +11/06/2021 23:00:31 - INFO - __main__ - Step 12742: {'lr': 0.0004935301591379391, 'samples': 2446464, 'steps': 12741, 'loss/train': 2.125699520111084} +11/06/2021 23:00:32 - INFO - __main__ - Step 12743: {'lr': 0.0004935289596064042, 'samples': 2446656, 'steps': 12742, 'loss/train': 1.4492217302322388} +11/06/2021 23:00:32 - INFO - __main__ - Step 12744: {'lr': 0.0004935277599651389, 'samples': 2446848, 'steps': 12743, 'loss/train': 1.4659162759780884} +11/06/2021 23:00:32 - INFO - __main__ - Step 12745: {'lr': 0.0004935265602141437, 'samples': 2447040, 'steps': 12744, 'loss/train': 2.072901964187622} +11/06/2021 23:00:33 - INFO - __main__ - Step 12746: {'lr': 0.0004935253603534193, 'samples': 2447232, 'steps': 12745, 'loss/train': 1.745668649673462} +11/06/2021 23:00:33 - INFO - __main__ - Step 12747: {'lr': 0.0004935241603829661, 'samples': 2447424, 'steps': 12746, 'loss/train': 1.9850726127624512} +11/06/2021 23:00:34 - INFO - __main__ - Step 12748: {'lr': 0.0004935229603027847, 'samples': 2447616, 'steps': 12747, 'loss/train': 1.3477630615234375} +11/06/2021 23:00:34 - INFO - __main__ - Step 12749: {'lr': 0.0004935217601128755, 'samples': 2447808, 'steps': 12748, 'loss/train': 1.7236028909683228} +11/06/2021 23:00:35 - INFO - __main__ - Step 12750: {'lr': 0.0004935205598132393, 'samples': 2448000, 'steps': 12749, 'loss/train': 1.637121319770813} +11/06/2021 23:00:35 - INFO - __main__ - Step 12751: {'lr': 0.0004935193594038764, 'samples': 2448192, 'steps': 12750, 'loss/train': 1.4060014486312866} +11/06/2021 23:00:35 - INFO - __main__ - Step 12752: {'lr': 0.0004935181588847876, 'samples': 2448384, 'steps': 12751, 'loss/train': 1.7447482347488403} +11/06/2021 23:00:36 - INFO - __main__ - Step 12753: {'lr': 0.0004935169582559731, 'samples': 2448576, 'steps': 12752, 'loss/train': 2.0324788093566895} +11/06/2021 23:00:37 - INFO - __main__ - Step 12754: {'lr': 0.0004935157575174336, 'samples': 2448768, 'steps': 12753, 'loss/train': 1.7007369995117188} +11/06/2021 23:00:37 - INFO - __main__ - Step 12755: {'lr': 0.0004935145566691698, 'samples': 2448960, 'steps': 12754, 'loss/train': 1.9936100244522095} +11/06/2021 23:00:37 - INFO - __main__ - Step 12756: {'lr': 0.000493513355711182, 'samples': 2449152, 'steps': 12755, 'loss/train': 1.6351784467697144} +11/06/2021 23:00:38 - INFO - __main__ - Step 12757: {'lr': 0.0004935121546434708, 'samples': 2449344, 'steps': 12756, 'loss/train': 1.7019697427749634} +11/06/2021 23:00:39 - INFO - __main__ - Step 12758: {'lr': 0.0004935109534660368, 'samples': 2449536, 'steps': 12757, 'loss/train': 1.8127813339233398} +11/06/2021 23:00:39 - INFO - __main__ - Step 12759: {'lr': 0.0004935097521788805, 'samples': 2449728, 'steps': 12758, 'loss/train': 0.67855304479599} +11/06/2021 23:00:40 - INFO - __main__ - Step 12760: {'lr': 0.0004935085507820026, 'samples': 2449920, 'steps': 12759, 'loss/train': 2.1449859142303467} +11/06/2021 23:00:40 - INFO - __main__ - Step 12761: {'lr': 0.0004935073492754034, 'samples': 2450112, 'steps': 12760, 'loss/train': 1.3522168397903442} +11/06/2021 23:00:40 - INFO - __main__ - Step 12762: {'lr': 0.0004935061476590835, 'samples': 2450304, 'steps': 12761, 'loss/train': 0.9896982908248901} +11/06/2021 23:00:41 - INFO - __main__ - Step 12763: {'lr': 0.0004935049459330437, 'samples': 2450496, 'steps': 12762, 'loss/train': 1.8502204418182373} +11/06/2021 23:00:42 - INFO - __main__ - Step 12764: {'lr': 0.0004935037440972841, 'samples': 2450688, 'steps': 12763, 'loss/train': 2.6931633949279785} +11/06/2021 23:00:42 - INFO - __main__ - Step 12765: {'lr': 0.0004935025421518056, 'samples': 2450880, 'steps': 12764, 'loss/train': 1.5279968976974487} +11/06/2021 23:00:42 - INFO - __main__ - Step 12766: {'lr': 0.0004935013400966086, 'samples': 2451072, 'steps': 12765, 'loss/train': 1.7780354022979736} +11/06/2021 23:00:43 - INFO - __main__ - Step 12767: {'lr': 0.0004935001379316935, 'samples': 2451264, 'steps': 12766, 'loss/train': 1.5596141815185547} +11/06/2021 23:00:43 - INFO - __main__ - Step 12768: {'lr': 0.0004934989356570611, 'samples': 2451456, 'steps': 12767, 'loss/train': 1.7943576574325562} +11/06/2021 23:00:44 - INFO - __main__ - Step 12769: {'lr': 0.0004934977332727118, 'samples': 2451648, 'steps': 12768, 'loss/train': 1.703242301940918} +11/06/2021 23:00:44 - INFO - __main__ - Step 12770: {'lr': 0.0004934965307786464, 'samples': 2451840, 'steps': 12769, 'loss/train': 1.6350740194320679} +11/06/2021 23:00:45 - INFO - __main__ - Step 12771: {'lr': 0.0004934953281748649, 'samples': 2452032, 'steps': 12770, 'loss/train': 1.350691318511963} +11/06/2021 23:00:45 - INFO - __main__ - Step 12772: {'lr': 0.0004934941254613684, 'samples': 2452224, 'steps': 12771, 'loss/train': 1.6434681415557861} +11/06/2021 23:00:45 - INFO - __main__ - Step 12773: {'lr': 0.0004934929226381572, 'samples': 2452416, 'steps': 12772, 'loss/train': 1.567505121231079} +11/06/2021 23:00:47 - INFO - __main__ - Step 12774: {'lr': 0.0004934917197052317, 'samples': 2452608, 'steps': 12773, 'loss/train': 1.6525659561157227} +11/06/2021 23:00:47 - INFO - __main__ - Step 12775: {'lr': 0.0004934905166625926, 'samples': 2452800, 'steps': 12774, 'loss/train': 1.8389402627944946} +11/06/2021 23:00:48 - INFO - __main__ - Step 12776: {'lr': 0.0004934893135102405, 'samples': 2452992, 'steps': 12775, 'loss/train': 0.4809941351413727} +11/06/2021 23:00:48 - INFO - __main__ - Step 12777: {'lr': 0.0004934881102481759, 'samples': 2453184, 'steps': 12776, 'loss/train': 1.6852707862854004} +11/06/2021 23:00:48 - INFO - __main__ - Step 12778: {'lr': 0.0004934869068763992, 'samples': 2453376, 'steps': 12777, 'loss/train': 1.8732150793075562} +11/06/2021 23:00:49 - INFO - __main__ - Step 12779: {'lr': 0.0004934857033949112, 'samples': 2453568, 'steps': 12778, 'loss/train': 1.4058620929718018} +11/06/2021 23:00:49 - INFO - __main__ - Step 12780: {'lr': 0.0004934844998037122, 'samples': 2453760, 'steps': 12779, 'loss/train': 1.6926714181900024} +11/06/2021 23:00:50 - INFO - __main__ - Step 12781: {'lr': 0.0004934832961028028, 'samples': 2453952, 'steps': 12780, 'loss/train': 1.8323222398757935} +11/06/2021 23:00:50 - INFO - __main__ - Step 12782: {'lr': 0.0004934820922921836, 'samples': 2454144, 'steps': 12781, 'loss/train': 1.9833849668502808} +11/06/2021 23:00:51 - INFO - __main__ - Step 12783: {'lr': 0.0004934808883718553, 'samples': 2454336, 'steps': 12782, 'loss/train': 1.3475416898727417} +11/06/2021 23:00:52 - INFO - __main__ - Step 12784: {'lr': 0.0004934796843418181, 'samples': 2454528, 'steps': 12783, 'loss/train': 1.8701623678207397} +11/06/2021 23:00:52 - INFO - __main__ - Step 12785: {'lr': 0.0004934784802020728, 'samples': 2454720, 'steps': 12784, 'loss/train': 1.69837486743927} +11/06/2021 23:00:52 - INFO - __main__ - Step 12786: {'lr': 0.0004934772759526198, 'samples': 2454912, 'steps': 12785, 'loss/train': 1.8089841604232788} +11/06/2021 23:00:53 - INFO - __main__ - Step 12787: {'lr': 0.0004934760715934597, 'samples': 2455104, 'steps': 12786, 'loss/train': 1.5334937572479248} +11/06/2021 23:00:53 - INFO - __main__ - Step 12788: {'lr': 0.0004934748671245931, 'samples': 2455296, 'steps': 12787, 'loss/train': 1.691651463508606} +11/06/2021 23:00:54 - INFO - __main__ - Step 12789: {'lr': 0.0004934736625460203, 'samples': 2455488, 'steps': 12788, 'loss/train': 1.8990588188171387} +11/06/2021 23:00:54 - INFO - __main__ - Step 12790: {'lr': 0.0004934724578577422, 'samples': 2455680, 'steps': 12789, 'loss/train': 1.2063190937042236} +11/06/2021 23:00:55 - INFO - __main__ - Step 12791: {'lr': 0.0004934712530597591, 'samples': 2455872, 'steps': 12790, 'loss/train': 1.6075855493545532} +11/06/2021 23:00:55 - INFO - __main__ - Step 12792: {'lr': 0.0004934700481520717, 'samples': 2456064, 'steps': 12791, 'loss/train': 1.9511923789978027} +11/06/2021 23:00:55 - INFO - __main__ - Step 12793: {'lr': 0.0004934688431346804, 'samples': 2456256, 'steps': 12792, 'loss/train': 1.5929433107376099} +11/06/2021 23:00:56 - INFO - __main__ - Step 12794: {'lr': 0.0004934676380075857, 'samples': 2456448, 'steps': 12793, 'loss/train': 1.243303894996643} +11/06/2021 23:00:57 - INFO - __main__ - Step 12795: {'lr': 0.0004934664327707884, 'samples': 2456640, 'steps': 12794, 'loss/train': 2.0900375843048096} +11/06/2021 23:00:57 - INFO - __main__ - Step 12796: {'lr': 0.0004934652274242888, 'samples': 2456832, 'steps': 12795, 'loss/train': 1.7989342212677002} +11/06/2021 23:00:58 - INFO - __main__ - Step 12797: {'lr': 0.0004934640219680875, 'samples': 2457024, 'steps': 12796, 'loss/train': 0.9342484474182129} +11/06/2021 23:00:58 - INFO - __main__ - Step 12798: {'lr': 0.0004934628164021851, 'samples': 2457216, 'steps': 12797, 'loss/train': 0.24721074104309082} +11/06/2021 23:00:59 - INFO - __main__ - Step 12799: {'lr': 0.0004934616107265821, 'samples': 2457408, 'steps': 12798, 'loss/train': 2.198434591293335} +11/06/2021 23:00:59 - INFO - __main__ - Step 12800: {'lr': 0.0004934604049412791, 'samples': 2457600, 'steps': 12799, 'loss/train': 1.550801157951355} +11/06/2021 23:01:00 - INFO - __main__ - Step 12801: {'lr': 0.0004934591990462766, 'samples': 2457792, 'steps': 12800, 'loss/train': 1.3108569383621216} +11/06/2021 23:01:00 - INFO - __main__ - Step 12802: {'lr': 0.0004934579930415751, 'samples': 2457984, 'steps': 12801, 'loss/train': 1.9333668947219849} +11/06/2021 23:01:00 - INFO - __main__ - Step 12803: {'lr': 0.0004934567869271751, 'samples': 2458176, 'steps': 12802, 'loss/train': 1.9801455736160278} +11/06/2021 23:01:01 - INFO - __main__ - Step 12804: {'lr': 0.0004934555807030774, 'samples': 2458368, 'steps': 12803, 'loss/train': 1.053701400756836} +11/06/2021 23:01:02 - INFO - __main__ - Step 12805: {'lr': 0.0004934543743692822, 'samples': 2458560, 'steps': 12804, 'loss/train': 1.4716850519180298} +11/06/2021 23:01:02 - INFO - __main__ - Step 12806: {'lr': 0.0004934531679257903, 'samples': 2458752, 'steps': 12805, 'loss/train': 1.5304038524627686} +11/06/2021 23:01:03 - INFO - __main__ - Step 12807: {'lr': 0.0004934519613726022, 'samples': 2458944, 'steps': 12806, 'loss/train': 1.6712217330932617} +11/06/2021 23:01:03 - INFO - __main__ - Step 12808: {'lr': 0.0004934507547097183, 'samples': 2459136, 'steps': 12807, 'loss/train': 1.6593072414398193} +11/06/2021 23:01:03 - INFO - __main__ - Step 12809: {'lr': 0.0004934495479371393, 'samples': 2459328, 'steps': 12808, 'loss/train': 4.7572102546691895} +11/06/2021 23:01:04 - INFO - __main__ - Step 12810: {'lr': 0.0004934483410548658, 'samples': 2459520, 'steps': 12809, 'loss/train': 0.9556400775909424} +11/06/2021 23:01:05 - INFO - __main__ - Step 12811: {'lr': 0.0004934471340628981, 'samples': 2459712, 'steps': 12810, 'loss/train': 0.8056848049163818} +11/06/2021 23:01:05 - INFO - __main__ - Step 12812: {'lr': 0.000493445926961237, 'samples': 2459904, 'steps': 12811, 'loss/train': 1.6957072019577026} +11/06/2021 23:01:05 - INFO - __main__ - Step 12813: {'lr': 0.0004934447197498828, 'samples': 2460096, 'steps': 12812, 'loss/train': 1.9989805221557617} +11/06/2021 23:01:06 - INFO - __main__ - Step 12814: {'lr': 0.0004934435124288362, 'samples': 2460288, 'steps': 12813, 'loss/train': 2.132337808609009} +11/06/2021 23:01:07 - INFO - __main__ - Step 12815: {'lr': 0.0004934423049980977, 'samples': 2460480, 'steps': 12814, 'loss/train': 1.7412266731262207} +11/06/2021 23:01:07 - INFO - __main__ - Step 12816: {'lr': 0.0004934410974576679, 'samples': 2460672, 'steps': 12815, 'loss/train': 1.9368259906768799} +11/06/2021 23:01:07 - INFO - __main__ - Step 12817: {'lr': 0.0004934398898075472, 'samples': 2460864, 'steps': 12816, 'loss/train': 1.8307538032531738} +11/06/2021 23:01:08 - INFO - __main__ - Step 12818: {'lr': 0.0004934386820477363, 'samples': 2461056, 'steps': 12817, 'loss/train': 1.4713562726974487} +11/06/2021 23:01:08 - INFO - __main__ - Step 12819: {'lr': 0.0004934374741782357, 'samples': 2461248, 'steps': 12818, 'loss/train': 1.4008110761642456} +11/06/2021 23:01:09 - INFO - __main__ - Step 12820: {'lr': 0.000493436266199046, 'samples': 2461440, 'steps': 12819, 'loss/train': 1.4729948043823242} +11/06/2021 23:01:09 - INFO - __main__ - Step 12821: {'lr': 0.0004934350581101676, 'samples': 2461632, 'steps': 12820, 'loss/train': 1.7127310037612915} +11/06/2021 23:01:10 - INFO - __main__ - Step 12822: {'lr': 0.0004934338499116011, 'samples': 2461824, 'steps': 12821, 'loss/train': 1.610058307647705} +11/06/2021 23:01:10 - INFO - __main__ - Step 12823: {'lr': 0.0004934326416033471, 'samples': 2462016, 'steps': 12822, 'loss/train': 1.9114627838134766} +11/06/2021 23:01:10 - INFO - __main__ - Step 12824: {'lr': 0.0004934314331854061, 'samples': 2462208, 'steps': 12823, 'loss/train': 1.826889157295227} +11/06/2021 23:01:12 - INFO - __main__ - Step 12825: {'lr': 0.0004934302246577786, 'samples': 2462400, 'steps': 12824, 'loss/train': 1.7399663925170898} +11/06/2021 23:01:12 - INFO - __main__ - Step 12826: {'lr': 0.0004934290160204652, 'samples': 2462592, 'steps': 12825, 'loss/train': 1.5818183422088623} +11/06/2021 23:01:12 - INFO - __main__ - Step 12827: {'lr': 0.0004934278072734666, 'samples': 2462784, 'steps': 12826, 'loss/train': 1.4330865144729614} +11/06/2021 23:01:13 - INFO - __main__ - Step 12828: {'lr': 0.000493426598416783, 'samples': 2462976, 'steps': 12827, 'loss/train': 1.77826988697052} +11/06/2021 23:01:13 - INFO - __main__ - Step 12829: {'lr': 0.0004934253894504152, 'samples': 2463168, 'steps': 12828, 'loss/train': 1.1493207216262817} +11/06/2021 23:01:14 - INFO - __main__ - Step 12830: {'lr': 0.0004934241803743637, 'samples': 2463360, 'steps': 12829, 'loss/train': 1.8719111680984497} +11/06/2021 23:01:14 - INFO - __main__ - Step 12831: {'lr': 0.000493422971188629, 'samples': 2463552, 'steps': 12830, 'loss/train': 1.228978157043457} +11/06/2021 23:01:15 - INFO - __main__ - Step 12832: {'lr': 0.0004934217618932117, 'samples': 2463744, 'steps': 12831, 'loss/train': 1.8399741649627686} +11/06/2021 23:01:15 - INFO - __main__ - Step 12833: {'lr': 0.0004934205524881123, 'samples': 2463936, 'steps': 12832, 'loss/train': 1.9681713581085205} +11/06/2021 23:01:15 - INFO - __main__ - Step 12834: {'lr': 0.0004934193429733312, 'samples': 2464128, 'steps': 12833, 'loss/train': 0.9652214050292969} +11/06/2021 23:01:17 - INFO - __main__ - Step 12835: {'lr': 0.0004934181333488693, 'samples': 2464320, 'steps': 12834, 'loss/train': 1.6454654932022095} +11/06/2021 23:01:18 - INFO - __main__ - Step 12836: {'lr': 0.0004934169236147268, 'samples': 2464512, 'steps': 12835, 'loss/train': 1.410776138305664} +11/06/2021 23:01:18 - INFO - __main__ - Step 12837: {'lr': 0.0004934157137709044, 'samples': 2464704, 'steps': 12836, 'loss/train': 1.5523715019226074} +11/06/2021 23:01:18 - INFO - __main__ - Step 12838: {'lr': 0.0004934145038174028, 'samples': 2464896, 'steps': 12837, 'loss/train': 1.6767199039459229} +11/06/2021 23:01:19 - INFO - __main__ - Step 12839: {'lr': 0.0004934132937542223, 'samples': 2465088, 'steps': 12838, 'loss/train': 1.64377760887146} +11/06/2021 23:01:19 - INFO - __main__ - Step 12840: {'lr': 0.0004934120835813634, 'samples': 2465280, 'steps': 12839, 'loss/train': 5.639301776885986} +11/06/2021 23:01:19 - INFO - __main__ - Step 12841: {'lr': 0.0004934108732988269, 'samples': 2465472, 'steps': 12840, 'loss/train': 5.523209095001221} +11/06/2021 23:01:20 - INFO - __main__ - Step 12842: {'lr': 0.0004934096629066133, 'samples': 2465664, 'steps': 12841, 'loss/train': 5.597353458404541} +11/06/2021 23:01:21 - INFO - __main__ - Step 12843: {'lr': 0.0004934084524047229, 'samples': 2465856, 'steps': 12842, 'loss/train': 2.109654188156128} +11/06/2021 23:01:21 - INFO - __main__ - Step 12844: {'lr': 0.0004934072417931564, 'samples': 2466048, 'steps': 12843, 'loss/train': 1.7585923671722412} +11/06/2021 23:01:22 - INFO - __main__ - Step 12845: {'lr': 0.0004934060310719145, 'samples': 2466240, 'steps': 12844, 'loss/train': 1.6276121139526367} +11/06/2021 23:01:22 - INFO - __main__ - Step 12846: {'lr': 0.0004934048202409974, 'samples': 2466432, 'steps': 12845, 'loss/train': 1.8930996656417847} +11/06/2021 23:01:22 - INFO - __main__ - Step 12847: {'lr': 0.000493403609300406, 'samples': 2466624, 'steps': 12846, 'loss/train': 1.744299054145813} +11/06/2021 23:01:23 - INFO - __main__ - Step 12848: {'lr': 0.0004934023982501406, 'samples': 2466816, 'steps': 12847, 'loss/train': 1.2807785272598267} +11/06/2021 23:01:24 - INFO - __main__ - Step 12849: {'lr': 0.000493401187090202, 'samples': 2467008, 'steps': 12848, 'loss/train': 1.8994098901748657} +11/06/2021 23:01:24 - INFO - __main__ - Step 12850: {'lr': 0.0004933999758205904, 'samples': 2467200, 'steps': 12849, 'loss/train': 1.5451972484588623} +11/06/2021 23:01:24 - INFO - __main__ - Step 12851: {'lr': 0.0004933987644413066, 'samples': 2467392, 'steps': 12850, 'loss/train': 1.0521020889282227} +11/06/2021 23:01:25 - INFO - __main__ - Step 12852: {'lr': 0.0004933975529523511, 'samples': 2467584, 'steps': 12851, 'loss/train': 1.6571444272994995} +11/06/2021 23:01:26 - INFO - __main__ - Step 12853: {'lr': 0.0004933963413537244, 'samples': 2467776, 'steps': 12852, 'loss/train': 1.570617437362671} +11/06/2021 23:01:26 - INFO - __main__ - Step 12854: {'lr': 0.000493395129645427, 'samples': 2467968, 'steps': 12853, 'loss/train': 0.8766611218452454} +11/06/2021 23:01:26 - INFO - __main__ - Step 12855: {'lr': 0.0004933939178274596, 'samples': 2468160, 'steps': 12854, 'loss/train': 1.5354561805725098} +11/06/2021 23:01:27 - INFO - __main__ - Step 12856: {'lr': 0.0004933927058998226, 'samples': 2468352, 'steps': 12855, 'loss/train': 1.74991774559021} +11/06/2021 23:01:27 - INFO - __main__ - Step 12857: {'lr': 0.0004933914938625166, 'samples': 2468544, 'steps': 12856, 'loss/train': 1.6767778396606445} +11/06/2021 23:01:28 - INFO - __main__ - Step 12858: {'lr': 0.0004933902817155422, 'samples': 2468736, 'steps': 12857, 'loss/train': 1.899521827697754} +11/06/2021 23:01:29 - INFO - __main__ - Step 12859: {'lr': 0.0004933890694588998, 'samples': 2468928, 'steps': 12858, 'loss/train': 1.837016224861145} +11/06/2021 23:01:29 - INFO - __main__ - Step 12860: {'lr': 0.0004933878570925901, 'samples': 2469120, 'steps': 12859, 'loss/train': 1.6478303670883179} +11/06/2021 23:01:29 - INFO - __main__ - Step 12861: {'lr': 0.0004933866446166136, 'samples': 2469312, 'steps': 12860, 'loss/train': 1.84537935256958} +11/06/2021 23:01:30 - INFO - __main__ - Step 12862: {'lr': 0.0004933854320309708, 'samples': 2469504, 'steps': 12861, 'loss/train': 2.0039706230163574} +11/06/2021 23:01:31 - INFO - __main__ - Step 12863: {'lr': 0.0004933842193356624, 'samples': 2469696, 'steps': 12862, 'loss/train': 2.835719585418701} +11/06/2021 23:01:31 - INFO - __main__ - Step 12864: {'lr': 0.0004933830065306887, 'samples': 2469888, 'steps': 12863, 'loss/train': 2.0461788177490234} +11/06/2021 23:01:31 - INFO - __main__ - Step 12865: {'lr': 0.0004933817936160504, 'samples': 2470080, 'steps': 12864, 'loss/train': 1.4113506078720093} +11/06/2021 23:01:32 - INFO - __main__ - Step 12866: {'lr': 0.0004933805805917479, 'samples': 2470272, 'steps': 12865, 'loss/train': 1.4473645687103271} +11/06/2021 23:01:32 - INFO - __main__ - Step 12867: {'lr': 0.000493379367457782, 'samples': 2470464, 'steps': 12866, 'loss/train': 1.7717403173446655} +11/06/2021 23:01:32 - INFO - __main__ - Step 12868: {'lr': 0.0004933781542141532, 'samples': 2470656, 'steps': 12867, 'loss/train': 1.985740303993225} +11/06/2021 23:01:34 - INFO - __main__ - Step 12869: {'lr': 0.0004933769408608618, 'samples': 2470848, 'steps': 12868, 'loss/train': 1.6742669343948364} +11/06/2021 23:01:34 - INFO - __main__ - Step 12870: {'lr': 0.0004933757273979086, 'samples': 2471040, 'steps': 12869, 'loss/train': 0.415326327085495} +11/06/2021 23:01:34 - INFO - __main__ - Step 12871: {'lr': 0.0004933745138252939, 'samples': 2471232, 'steps': 12870, 'loss/train': 1.893794298171997} +11/06/2021 23:01:35 - INFO - __main__ - Step 12872: {'lr': 0.0004933733001430186, 'samples': 2471424, 'steps': 12871, 'loss/train': 1.7198106050491333} +11/06/2021 23:01:35 - INFO - __main__ - Step 12873: {'lr': 0.000493372086351083, 'samples': 2471616, 'steps': 12872, 'loss/train': 2.0763978958129883} +11/06/2021 23:01:36 - INFO - __main__ - Step 12874: {'lr': 0.0004933708724494877, 'samples': 2471808, 'steps': 12873, 'loss/train': 1.426766276359558} +11/06/2021 23:01:36 - INFO - __main__ - Step 12875: {'lr': 0.0004933696584382331, 'samples': 2472000, 'steps': 12874, 'loss/train': 1.5616261959075928} +11/06/2021 23:01:37 - INFO - __main__ - Step 12876: {'lr': 0.00049336844431732, 'samples': 2472192, 'steps': 12875, 'loss/train': 1.1413694620132446} +11/06/2021 23:01:37 - INFO - __main__ - Step 12877: {'lr': 0.0004933672300867488, 'samples': 2472384, 'steps': 12876, 'loss/train': 1.5705578327178955} +11/06/2021 23:01:37 - INFO - __main__ - Step 12878: {'lr': 0.0004933660157465202, 'samples': 2472576, 'steps': 12877, 'loss/train': 1.6181583404541016} +11/06/2021 23:01:39 - INFO - __main__ - Step 12879: {'lr': 0.0004933648012966344, 'samples': 2472768, 'steps': 12878, 'loss/train': 2.557011842727661} +11/06/2021 23:01:39 - INFO - __main__ - Step 12880: {'lr': 0.0004933635867370923, 'samples': 2472960, 'steps': 12879, 'loss/train': 1.745104193687439} +11/06/2021 23:01:39 - INFO - __main__ - Step 12881: {'lr': 0.0004933623720678944, 'samples': 2473152, 'steps': 12880, 'loss/train': 1.816332459449768} +11/06/2021 23:01:40 - INFO - __main__ - Step 12882: {'lr': 0.000493361157289041, 'samples': 2473344, 'steps': 12881, 'loss/train': 1.7329145669937134} +11/06/2021 23:01:40 - INFO - __main__ - Step 12883: {'lr': 0.000493359942400533, 'samples': 2473536, 'steps': 12882, 'loss/train': 1.764685034751892} +11/06/2021 23:01:41 - INFO - __main__ - Step 12884: {'lr': 0.0004933587274023706, 'samples': 2473728, 'steps': 12883, 'loss/train': 1.9591374397277832} +11/06/2021 23:01:41 - INFO - __main__ - Step 12885: {'lr': 0.0004933575122945547, 'samples': 2473920, 'steps': 12884, 'loss/train': 1.8801758289337158} +11/06/2021 23:01:42 - INFO - __main__ - Step 12886: {'lr': 0.0004933562970770855, 'samples': 2474112, 'steps': 12885, 'loss/train': 1.7536741495132446} +11/06/2021 23:01:42 - INFO - __main__ - Step 12887: {'lr': 0.0004933550817499638, 'samples': 2474304, 'steps': 12886, 'loss/train': 1.2631752490997314} +11/06/2021 23:01:42 - INFO - __main__ - Step 12888: {'lr': 0.00049335386631319, 'samples': 2474496, 'steps': 12887, 'loss/train': 2.017979621887207} +11/06/2021 23:01:43 - INFO - __main__ - Step 12889: {'lr': 0.0004933526507667648, 'samples': 2474688, 'steps': 12888, 'loss/train': 2.223954200744629} +11/06/2021 23:01:44 - INFO - __main__ - Step 12890: {'lr': 0.0004933514351106885, 'samples': 2474880, 'steps': 12889, 'loss/train': 1.3178850412368774} +11/06/2021 23:01:44 - INFO - __main__ - Step 12891: {'lr': 0.0004933502193449618, 'samples': 2475072, 'steps': 12890, 'loss/train': 1.6767654418945312} +11/06/2021 23:01:44 - INFO - __main__ - Step 12892: {'lr': 0.0004933490034695853, 'samples': 2475264, 'steps': 12891, 'loss/train': 1.598570466041565} +11/06/2021 23:01:45 - INFO - __main__ - Step 12893: {'lr': 0.0004933477874845595, 'samples': 2475456, 'steps': 12892, 'loss/train': 1.9039117097854614} +11/06/2021 23:01:46 - INFO - __main__ - Step 12894: {'lr': 0.000493346571389885, 'samples': 2475648, 'steps': 12893, 'loss/train': 1.4883739948272705} +11/06/2021 23:01:46 - INFO - __main__ - Step 12895: {'lr': 0.0004933453551855622, 'samples': 2475840, 'steps': 12894, 'loss/train': 1.6035698652267456} +11/06/2021 23:01:47 - INFO - __main__ - Step 12896: {'lr': 0.0004933441388715919, 'samples': 2476032, 'steps': 12895, 'loss/train': 1.7423779964447021} +11/06/2021 23:01:47 - INFO - __main__ - Step 12897: {'lr': 0.0004933429224479743, 'samples': 2476224, 'steps': 12896, 'loss/train': 1.6877235174179077} +11/06/2021 23:01:48 - INFO - __main__ - Step 12898: {'lr': 0.0004933417059147102, 'samples': 2476416, 'steps': 12897, 'loss/train': 1.5222456455230713} +11/06/2021 23:01:48 - INFO - __main__ - Step 12899: {'lr': 0.0004933404892718, 'samples': 2476608, 'steps': 12898, 'loss/train': 0.5296525955200195} +11/06/2021 23:01:50 - INFO - __main__ - Step 12900: {'lr': 0.0004933392725192444, 'samples': 2476800, 'steps': 12899, 'loss/train': 2.3114047050476074} +11/06/2021 23:01:50 - INFO - __main__ - Step 12901: {'lr': 0.000493338055657044, 'samples': 2476992, 'steps': 12900, 'loss/train': 1.6073651313781738} +11/06/2021 23:01:50 - INFO - __main__ - Step 12902: {'lr': 0.0004933368386851991, 'samples': 2477184, 'steps': 12901, 'loss/train': 0.23120321333408356} +11/06/2021 23:01:51 - INFO - __main__ - Step 12903: {'lr': 0.0004933356216037104, 'samples': 2477376, 'steps': 12902, 'loss/train': 1.398972749710083} +11/06/2021 23:01:51 - INFO - __main__ - Step 12904: {'lr': 0.0004933344044125784, 'samples': 2477568, 'steps': 12903, 'loss/train': 1.585076093673706} +11/06/2021 23:01:52 - INFO - __main__ - Step 12905: {'lr': 0.0004933331871118037, 'samples': 2477760, 'steps': 12904, 'loss/train': 1.9329192638397217} +11/06/2021 23:01:52 - INFO - __main__ - Step 12906: {'lr': 0.0004933319697013869, 'samples': 2477952, 'steps': 12905, 'loss/train': 1.082170844078064} +11/06/2021 23:01:53 - INFO - __main__ - Step 12907: {'lr': 0.0004933307521813282, 'samples': 2478144, 'steps': 12906, 'loss/train': 1.3846449851989746} +11/06/2021 23:01:53 - INFO - __main__ - Step 12908: {'lr': 0.0004933295345516287, 'samples': 2478336, 'steps': 12907, 'loss/train': 1.5094048976898193} +11/06/2021 23:01:53 - INFO - __main__ - Step 12909: {'lr': 0.0004933283168122886, 'samples': 2478528, 'steps': 12908, 'loss/train': 1.7825679779052734} +11/06/2021 23:01:54 - INFO - __main__ - Step 12910: {'lr': 0.0004933270989633084, 'samples': 2478720, 'steps': 12909, 'loss/train': 2.0155463218688965} +11/06/2021 23:01:55 - INFO - __main__ - Step 12911: {'lr': 0.0004933258810046889, 'samples': 2478912, 'steps': 12910, 'loss/train': 1.8153250217437744} +11/06/2021 23:01:55 - INFO - __main__ - Step 12912: {'lr': 0.0004933246629364304, 'samples': 2479104, 'steps': 12911, 'loss/train': 1.8701039552688599} +11/06/2021 23:01:55 - INFO - __main__ - Step 12913: {'lr': 0.0004933234447585337, 'samples': 2479296, 'steps': 12912, 'loss/train': 1.6900960206985474} +11/06/2021 23:01:56 - INFO - __main__ - Step 12914: {'lr': 0.0004933222264709991, 'samples': 2479488, 'steps': 12913, 'loss/train': 1.2670124769210815} +11/06/2021 23:01:57 - INFO - __main__ - Step 12915: {'lr': 0.0004933210080738273, 'samples': 2479680, 'steps': 12914, 'loss/train': 1.0174174308776855} +11/06/2021 23:01:57 - INFO - __main__ - Step 12916: {'lr': 0.0004933197895670187, 'samples': 2479872, 'steps': 12915, 'loss/train': 1.1427866220474243} +11/06/2021 23:01:58 - INFO - __main__ - Step 12917: {'lr': 0.0004933185709505741, 'samples': 2480064, 'steps': 12916, 'loss/train': 1.5414581298828125} +11/06/2021 23:01:58 - INFO - __main__ - Step 12918: {'lr': 0.0004933173522244939, 'samples': 2480256, 'steps': 12917, 'loss/train': 1.7401179075241089} +11/06/2021 23:01:58 - INFO - __main__ - Step 12919: {'lr': 0.0004933161333887786, 'samples': 2480448, 'steps': 12918, 'loss/train': 0.29492583870887756} +11/06/2021 23:02:00 - INFO - __main__ - Step 12920: {'lr': 0.0004933149144434288, 'samples': 2480640, 'steps': 12919, 'loss/train': 1.3319393396377563} +11/06/2021 23:02:00 - INFO - __main__ - Step 12921: {'lr': 0.0004933136953884451, 'samples': 2480832, 'steps': 12920, 'loss/train': 1.2883689403533936} +11/06/2021 23:02:00 - INFO - __main__ - Step 12922: {'lr': 0.0004933124762238279, 'samples': 2481024, 'steps': 12921, 'loss/train': 1.720632791519165} +11/06/2021 23:02:01 - INFO - __main__ - Step 12923: {'lr': 0.000493311256949578, 'samples': 2481216, 'steps': 12922, 'loss/train': 1.5766397714614868} +11/06/2021 23:02:01 - INFO - __main__ - Step 12924: {'lr': 0.0004933100375656957, 'samples': 2481408, 'steps': 12923, 'loss/train': 1.3622182607650757} +11/06/2021 23:02:02 - INFO - __main__ - Step 12925: {'lr': 0.0004933088180721817, 'samples': 2481600, 'steps': 12924, 'loss/train': 1.876354694366455} +11/06/2021 23:02:02 - INFO - __main__ - Step 12926: {'lr': 0.0004933075984690365, 'samples': 2481792, 'steps': 12925, 'loss/train': 1.9899784326553345} +11/06/2021 23:02:03 - INFO - __main__ - Step 12927: {'lr': 0.0004933063787562606, 'samples': 2481984, 'steps': 12926, 'loss/train': 1.0341933965682983} +11/06/2021 23:02:03 - INFO - __main__ - Step 12928: {'lr': 0.0004933051589338547, 'samples': 2482176, 'steps': 12927, 'loss/train': 1.815047025680542} +11/06/2021 23:02:03 - INFO - __main__ - Step 12929: {'lr': 0.0004933039390018192, 'samples': 2482368, 'steps': 12928, 'loss/train': 1.346707820892334} +11/06/2021 23:02:04 - INFO - __main__ - Step 12930: {'lr': 0.0004933027189601547, 'samples': 2482560, 'steps': 12929, 'loss/train': 1.6749612092971802} +11/06/2021 23:02:05 - INFO - __main__ - Step 12931: {'lr': 0.0004933014988088616, 'samples': 2482752, 'steps': 12930, 'loss/train': 1.7851786613464355} +11/06/2021 23:02:05 - INFO - __main__ - Step 12932: {'lr': 0.0004933002785479408, 'samples': 2482944, 'steps': 12931, 'loss/train': 1.2040504217147827} +11/06/2021 23:02:06 - INFO - __main__ - Step 12933: {'lr': 0.0004932990581773926, 'samples': 2483136, 'steps': 12932, 'loss/train': 1.582513451576233} +11/06/2021 23:02:06 - INFO - __main__ - Step 12934: {'lr': 0.0004932978376972175, 'samples': 2483328, 'steps': 12933, 'loss/train': 0.32476386427879333} +11/06/2021 23:02:06 - INFO - __main__ - Step 12935: {'lr': 0.0004932966171074163, 'samples': 2483520, 'steps': 12934, 'loss/train': 1.2251867055892944} +11/06/2021 23:02:07 - INFO - __main__ - Step 12936: {'lr': 0.0004932953964079893, 'samples': 2483712, 'steps': 12935, 'loss/train': 1.569036841392517} +11/06/2021 23:02:08 - INFO - __main__ - Step 12937: {'lr': 0.0004932941755989372, 'samples': 2483904, 'steps': 12936, 'loss/train': 1.9879359006881714} +11/06/2021 23:02:08 - INFO - __main__ - Step 12938: {'lr': 0.0004932929546802605, 'samples': 2484096, 'steps': 12937, 'loss/train': 1.4933514595031738} +11/06/2021 23:02:08 - INFO - __main__ - Step 12939: {'lr': 0.0004932917336519597, 'samples': 2484288, 'steps': 12938, 'loss/train': 1.2084016799926758} +11/06/2021 23:02:09 - INFO - __main__ - Step 12940: {'lr': 0.0004932905125140354, 'samples': 2484480, 'steps': 12939, 'loss/train': 1.5175234079360962} +11/06/2021 23:02:10 - INFO - __main__ - Step 12941: {'lr': 0.0004932892912664882, 'samples': 2484672, 'steps': 12940, 'loss/train': 1.7356916666030884} +11/06/2021 23:02:10 - INFO - __main__ - Step 12942: {'lr': 0.0004932880699093186, 'samples': 2484864, 'steps': 12941, 'loss/train': 1.6481016874313354} +11/06/2021 23:02:10 - INFO - __main__ - Step 12943: {'lr': 0.0004932868484425271, 'samples': 2485056, 'steps': 12942, 'loss/train': 1.8215060234069824} +11/06/2021 23:02:11 - INFO - __main__ - Step 12944: {'lr': 0.0004932856268661143, 'samples': 2485248, 'steps': 12943, 'loss/train': 1.5122387409210205} +11/06/2021 23:02:11 - INFO - __main__ - Step 12945: {'lr': 0.0004932844051800808, 'samples': 2485440, 'steps': 12944, 'loss/train': 1.9089007377624512} +11/06/2021 23:02:12 - INFO - __main__ - Step 12946: {'lr': 0.000493283183384427, 'samples': 2485632, 'steps': 12945, 'loss/train': 1.1102064847946167} +11/06/2021 23:02:13 - INFO - __main__ - Step 12947: {'lr': 0.0004932819614791537, 'samples': 2485824, 'steps': 12946, 'loss/train': 1.6587165594100952} +11/06/2021 23:02:13 - INFO - __main__ - Step 12948: {'lr': 0.0004932807394642612, 'samples': 2486016, 'steps': 12947, 'loss/train': 1.7909165620803833} +11/06/2021 23:02:13 - INFO - __main__ - Step 12949: {'lr': 0.0004932795173397501, 'samples': 2486208, 'steps': 12948, 'loss/train': 2.574796199798584} +11/06/2021 23:02:14 - INFO - __main__ - Step 12950: {'lr': 0.0004932782951056211, 'samples': 2486400, 'steps': 12949, 'loss/train': 2.0372557640075684} +11/06/2021 23:02:15 - INFO - __main__ - Step 12951: {'lr': 0.0004932770727618747, 'samples': 2486592, 'steps': 12950, 'loss/train': 3.691620349884033} +11/06/2021 23:02:15 - INFO - __main__ - Step 12952: {'lr': 0.0004932758503085114, 'samples': 2486784, 'steps': 12951, 'loss/train': 1.6988760232925415} +11/06/2021 23:02:15 - INFO - __main__ - Step 12953: {'lr': 0.0004932746277455317, 'samples': 2486976, 'steps': 12952, 'loss/train': 1.674808382987976} +11/06/2021 23:02:16 - INFO - __main__ - Step 12954: {'lr': 0.0004932734050729362, 'samples': 2487168, 'steps': 12953, 'loss/train': 1.2582000494003296} +11/06/2021 23:02:16 - INFO - __main__ - Step 12955: {'lr': 0.0004932721822907255, 'samples': 2487360, 'steps': 12954, 'loss/train': 1.9092744588851929} +11/06/2021 23:02:17 - INFO - __main__ - Step 12956: {'lr': 0.0004932709593989, 'samples': 2487552, 'steps': 12955, 'loss/train': 0.7507480978965759} +11/06/2021 23:02:17 - INFO - __main__ - Step 12957: {'lr': 0.0004932697363974604, 'samples': 2487744, 'steps': 12956, 'loss/train': 1.7332943677902222} +11/06/2021 23:02:18 - INFO - __main__ - Step 12958: {'lr': 0.0004932685132864072, 'samples': 2487936, 'steps': 12957, 'loss/train': 1.3571699857711792} +11/06/2021 23:02:18 - INFO - __main__ - Step 12959: {'lr': 0.0004932672900657411, 'samples': 2488128, 'steps': 12958, 'loss/train': 1.7823020219802856} +11/06/2021 23:02:18 - INFO - __main__ - Step 12960: {'lr': 0.0004932660667354623, 'samples': 2488320, 'steps': 12959, 'loss/train': 1.8756752014160156} +11/06/2021 23:02:20 - INFO - __main__ - Step 12961: {'lr': 0.0004932648432955717, 'samples': 2488512, 'steps': 12960, 'loss/train': 1.2283211946487427} +11/06/2021 23:02:20 - INFO - __main__ - Step 12962: {'lr': 0.0004932636197460698, 'samples': 2488704, 'steps': 12961, 'loss/train': 1.6361844539642334} +11/06/2021 23:02:20 - INFO - __main__ - Step 12963: {'lr': 0.0004932623960869569, 'samples': 2488896, 'steps': 12962, 'loss/train': 2.1100404262542725} +11/06/2021 23:02:21 - INFO - __main__ - Step 12964: {'lr': 0.0004932611723182338, 'samples': 2489088, 'steps': 12963, 'loss/train': 2.5909249782562256} +11/06/2021 23:02:21 - INFO - __main__ - Step 12965: {'lr': 0.000493259948439901, 'samples': 2489280, 'steps': 12964, 'loss/train': 1.8154479265213013} +11/06/2021 23:02:21 - INFO - __main__ - Step 12966: {'lr': 0.0004932587244519589, 'samples': 2489472, 'steps': 12965, 'loss/train': 1.5690723657608032} +11/06/2021 23:02:22 - INFO - __main__ - Step 12967: {'lr': 0.0004932575003544083, 'samples': 2489664, 'steps': 12966, 'loss/train': 1.8327417373657227} +11/06/2021 23:02:23 - INFO - __main__ - Step 12968: {'lr': 0.0004932562761472496, 'samples': 2489856, 'steps': 12967, 'loss/train': 1.6555702686309814} +11/06/2021 23:02:23 - INFO - __main__ - Step 12969: {'lr': 0.0004932550518304833, 'samples': 2490048, 'steps': 12968, 'loss/train': 1.708749532699585} +11/06/2021 23:02:23 - INFO - __main__ - Step 12970: {'lr': 0.0004932538274041101, 'samples': 2490240, 'steps': 12969, 'loss/train': 1.741576910018921} +11/06/2021 23:02:24 - INFO - __main__ - Step 12971: {'lr': 0.0004932526028681304, 'samples': 2490432, 'steps': 12970, 'loss/train': 1.9435254335403442} +11/06/2021 23:02:25 - INFO - __main__ - Step 12972: {'lr': 0.0004932513782225449, 'samples': 2490624, 'steps': 12971, 'loss/train': 1.1495224237442017} +11/06/2021 23:02:26 - INFO - __main__ - Step 12973: {'lr': 0.000493250153467354, 'samples': 2490816, 'steps': 12972, 'loss/train': 1.953014850616455} +11/06/2021 23:02:26 - INFO - __main__ - Step 12974: {'lr': 0.0004932489286025584, 'samples': 2491008, 'steps': 12973, 'loss/train': 1.809768557548523} +11/06/2021 23:02:26 - INFO - __main__ - Step 12975: {'lr': 0.0004932477036281586, 'samples': 2491200, 'steps': 12974, 'loss/train': 1.7049349546432495} +11/06/2021 23:02:27 - INFO - __main__ - Step 12976: {'lr': 0.0004932464785441552, 'samples': 2491392, 'steps': 12975, 'loss/train': 1.7377121448516846} +11/06/2021 23:02:27 - INFO - __main__ - Step 12977: {'lr': 0.0004932452533505486, 'samples': 2491584, 'steps': 12976, 'loss/train': 1.471701979637146} +11/06/2021 23:02:27 - INFO - __main__ - Step 12978: {'lr': 0.0004932440280473395, 'samples': 2491776, 'steps': 12977, 'loss/train': 1.8254519701004028} +11/06/2021 23:02:28 - INFO - __main__ - Step 12979: {'lr': 0.0004932428026345282, 'samples': 2491968, 'steps': 12978, 'loss/train': 1.869467854499817} +11/06/2021 23:02:29 - INFO - __main__ - Step 12980: {'lr': 0.0004932415771121157, 'samples': 2492160, 'steps': 12979, 'loss/train': 2.1289100646972656} +11/06/2021 23:02:29 - INFO - __main__ - Step 12981: {'lr': 0.0004932403514801021, 'samples': 2492352, 'steps': 12980, 'loss/train': 1.9706026315689087} +11/06/2021 23:02:29 - INFO - __main__ - Step 12982: {'lr': 0.0004932391257384883, 'samples': 2492544, 'steps': 12981, 'loss/train': 1.9861183166503906} +11/06/2021 23:02:30 - INFO - __main__ - Step 12983: {'lr': 0.0004932378998872746, 'samples': 2492736, 'steps': 12982, 'loss/train': 2.142361640930176} +11/06/2021 23:02:31 - INFO - __main__ - Step 12984: {'lr': 0.0004932366739264618, 'samples': 2492928, 'steps': 12983, 'loss/train': 0.2792867422103882} +11/06/2021 23:02:31 - INFO - __main__ - Step 12985: {'lr': 0.0004932354478560502, 'samples': 2493120, 'steps': 12984, 'loss/train': 1.9411041736602783} +11/06/2021 23:02:31 - INFO - __main__ - Step 12986: {'lr': 0.0004932342216760405, 'samples': 2493312, 'steps': 12985, 'loss/train': 1.882585883140564} +11/06/2021 23:02:32 - INFO - __main__ - Step 12987: {'lr': 0.0004932329953864331, 'samples': 2493504, 'steps': 12986, 'loss/train': 1.9840530157089233} +11/06/2021 23:02:32 - INFO - __main__ - Step 12988: {'lr': 0.0004932317689872287, 'samples': 2493696, 'steps': 12987, 'loss/train': 1.5482817888259888} +11/06/2021 23:02:33 - INFO - __main__ - Step 12989: {'lr': 0.000493230542478428, 'samples': 2493888, 'steps': 12988, 'loss/train': 1.229072093963623} +11/06/2021 23:02:34 - INFO - __main__ - Step 12990: {'lr': 0.0004932293158600312, 'samples': 2494080, 'steps': 12989, 'loss/train': 2.037853717803955} +11/06/2021 23:02:34 - INFO - __main__ - Step 12991: {'lr': 0.0004932280891320391, 'samples': 2494272, 'steps': 12990, 'loss/train': 1.9727879762649536} +11/06/2021 23:02:34 - INFO - __main__ - Step 12992: {'lr': 0.0004932268622944521, 'samples': 2494464, 'steps': 12991, 'loss/train': 2.1666083335876465} +11/06/2021 23:02:35 - INFO - __main__ - Step 12993: {'lr': 0.0004932256353472709, 'samples': 2494656, 'steps': 12992, 'loss/train': 1.4905357360839844} +11/06/2021 23:02:36 - INFO - __main__ - Step 12994: {'lr': 0.0004932244082904959, 'samples': 2494848, 'steps': 12993, 'loss/train': 1.4867180585861206} +11/06/2021 23:02:36 - INFO - __main__ - Step 12995: {'lr': 0.0004932231811241278, 'samples': 2495040, 'steps': 12994, 'loss/train': 0.779282808303833} +11/06/2021 23:02:36 - INFO - __main__ - Step 12996: {'lr': 0.0004932219538481672, 'samples': 2495232, 'steps': 12995, 'loss/train': 1.931758165359497} +11/06/2021 23:02:37 - INFO - __main__ - Step 12997: {'lr': 0.0004932207264626143, 'samples': 2495424, 'steps': 12996, 'loss/train': 1.4099301099777222} +11/06/2021 23:02:37 - INFO - __main__ - Step 12998: {'lr': 0.00049321949896747, 'samples': 2495616, 'steps': 12997, 'loss/train': 1.4822603464126587} +11/06/2021 23:02:39 - INFO - __main__ - Step 12999: {'lr': 0.0004932182713627348, 'samples': 2495808, 'steps': 12998, 'loss/train': 1.0354619026184082} +11/06/2021 23:02:39 - INFO - __main__ - Step 13000: {'lr': 0.0004932170436484091, 'samples': 2496000, 'steps': 12999, 'loss/train': 0.504642903804779} +11/06/2021 23:02:39 - INFO - __main__ - Step 13001: {'lr': 0.0004932158158244937, 'samples': 2496192, 'steps': 13000, 'loss/train': 0.3501379191875458} +11/06/2021 23:02:40 - INFO - __main__ - Step 13002: {'lr': 0.0004932145878909889, 'samples': 2496384, 'steps': 13001, 'loss/train': 1.9297839403152466} +11/06/2021 23:02:40 - INFO - __main__ - Step 13003: {'lr': 0.0004932133598478953, 'samples': 2496576, 'steps': 13002, 'loss/train': 1.891198754310608} +11/06/2021 23:02:41 - INFO - __main__ - Step 13004: {'lr': 0.0004932121316952136, 'samples': 2496768, 'steps': 13003, 'loss/train': 1.5406192541122437} +11/06/2021 23:02:41 - INFO - __main__ - Step 13005: {'lr': 0.0004932109034329442, 'samples': 2496960, 'steps': 13004, 'loss/train': 1.6352239847183228} +11/06/2021 23:02:42 - INFO - __main__ - Step 13006: {'lr': 0.0004932096750610879, 'samples': 2497152, 'steps': 13005, 'loss/train': 1.8479753732681274} +11/06/2021 23:02:42 - INFO - __main__ - Step 13007: {'lr': 0.0004932084465796449, 'samples': 2497344, 'steps': 13006, 'loss/train': 1.7984743118286133} +11/06/2021 23:02:43 - INFO - __main__ - Step 13008: {'lr': 0.000493207217988616, 'samples': 2497536, 'steps': 13007, 'loss/train': 1.575510025024414} +11/06/2021 23:02:44 - INFO - __main__ - Step 13009: {'lr': 0.0004932059892880016, 'samples': 2497728, 'steps': 13008, 'loss/train': 1.1041618585586548} +11/06/2021 23:02:44 - INFO - __main__ - Step 13010: {'lr': 0.0004932047604778025, 'samples': 2497920, 'steps': 13009, 'loss/train': 0.6211431622505188} +11/06/2021 23:02:45 - INFO - __main__ - Step 13011: {'lr': 0.0004932035315580188, 'samples': 2498112, 'steps': 13010, 'loss/train': 2.066260576248169} +11/06/2021 23:02:45 - INFO - __main__ - Step 13012: {'lr': 0.0004932023025286516, 'samples': 2498304, 'steps': 13011, 'loss/train': 1.6674903631210327} +11/06/2021 23:02:45 - INFO - __main__ - Step 13013: {'lr': 0.0004932010733897012, 'samples': 2498496, 'steps': 13012, 'loss/train': 1.5579228401184082} +11/06/2021 23:02:46 - INFO - __main__ - Step 13014: {'lr': 0.000493199844141168, 'samples': 2498688, 'steps': 13013, 'loss/train': 1.8701536655426025} +11/06/2021 23:02:47 - INFO - __main__ - Step 13015: {'lr': 0.0004931986147830527, 'samples': 2498880, 'steps': 13014, 'loss/train': 1.726219654083252} +11/06/2021 23:02:47 - INFO - __main__ - Step 13016: {'lr': 0.000493197385315356, 'samples': 2499072, 'steps': 13015, 'loss/train': 1.4233412742614746} +11/06/2021 23:02:47 - INFO - __main__ - Step 13017: {'lr': 0.0004931961557380782, 'samples': 2499264, 'steps': 13016, 'loss/train': 1.2359046936035156} +11/06/2021 23:02:48 - INFO - __main__ - Step 13018: {'lr': 0.00049319492605122, 'samples': 2499456, 'steps': 13017, 'loss/train': 1.8722537755966187} +11/06/2021 23:02:48 - INFO - __main__ - Step 13019: {'lr': 0.000493193696254782, 'samples': 2499648, 'steps': 13018, 'loss/train': 1.5985851287841797} +11/06/2021 23:02:49 - INFO - __main__ - Step 13020: {'lr': 0.0004931924663487646, 'samples': 2499840, 'steps': 13019, 'loss/train': 1.6530154943466187} +11/06/2021 23:02:50 - INFO - __main__ - Step 13021: {'lr': 0.0004931912363331683, 'samples': 2500032, 'steps': 13020, 'loss/train': 1.8538419008255005} +11/06/2021 23:02:50 - INFO - __main__ - Step 13022: {'lr': 0.000493190006207994, 'samples': 2500224, 'steps': 13021, 'loss/train': 1.3083375692367554} +11/06/2021 23:02:50 - INFO - __main__ - Step 13023: {'lr': 0.0004931887759732419, 'samples': 2500416, 'steps': 13022, 'loss/train': 1.6392176151275635} +11/06/2021 23:02:51 - INFO - __main__ - Step 13024: {'lr': 0.0004931875456289128, 'samples': 2500608, 'steps': 13023, 'loss/train': 1.1660975217819214} +11/06/2021 23:02:52 - INFO - __main__ - Step 13025: {'lr': 0.000493186315175007, 'samples': 2500800, 'steps': 13024, 'loss/train': 1.6558512449264526} +11/06/2021 23:02:52 - INFO - __main__ - Step 13026: {'lr': 0.0004931850846115253, 'samples': 2500992, 'steps': 13025, 'loss/train': 1.7009488344192505} +11/06/2021 23:02:52 - INFO - __main__ - Step 13027: {'lr': 0.0004931838539384681, 'samples': 2501184, 'steps': 13026, 'loss/train': 1.87421452999115} +11/06/2021 23:02:53 - INFO - __main__ - Step 13028: {'lr': 0.0004931826231558361, 'samples': 2501376, 'steps': 13027, 'loss/train': 1.698980450630188} +11/06/2021 23:02:53 - INFO - __main__ - Step 13029: {'lr': 0.0004931813922636297, 'samples': 2501568, 'steps': 13028, 'loss/train': 2.1995387077331543} +11/06/2021 23:02:53 - INFO - __main__ - Step 13030: {'lr': 0.0004931801612618494, 'samples': 2501760, 'steps': 13029, 'loss/train': 0.9826458692550659} +11/06/2021 23:02:54 - INFO - __main__ - Step 13031: {'lr': 0.0004931789301504961, 'samples': 2501952, 'steps': 13030, 'loss/train': 1.9155287742614746} +11/06/2021 23:02:55 - INFO - __main__ - Step 13032: {'lr': 0.00049317769892957, 'samples': 2502144, 'steps': 13031, 'loss/train': 2.2658934593200684} +11/06/2021 23:02:55 - INFO - __main__ - Step 13033: {'lr': 0.0004931764675990718, 'samples': 2502336, 'steps': 13032, 'loss/train': 1.7716729640960693} +11/06/2021 23:02:56 - INFO - __main__ - Step 13034: {'lr': 0.000493175236159002, 'samples': 2502528, 'steps': 13033, 'loss/train': 2.120985269546509} +11/06/2021 23:02:56 - INFO - __main__ - Step 13035: {'lr': 0.0004931740046093612, 'samples': 2502720, 'steps': 13034, 'loss/train': 1.8945417404174805} +11/06/2021 23:02:57 - INFO - __main__ - Step 13036: {'lr': 0.0004931727729501499, 'samples': 2502912, 'steps': 13035, 'loss/train': 1.613181471824646} +11/06/2021 23:02:57 - INFO - __main__ - Step 13037: {'lr': 0.0004931715411813689, 'samples': 2503104, 'steps': 13036, 'loss/train': 1.5703870058059692} +11/06/2021 23:02:58 - INFO - __main__ - Step 13038: {'lr': 0.0004931703093030183, 'samples': 2503296, 'steps': 13037, 'loss/train': 1.6445674896240234} +11/06/2021 23:02:58 - INFO - __main__ - Step 13039: {'lr': 0.0004931690773150991, 'samples': 2503488, 'steps': 13038, 'loss/train': 1.3863145112991333} +11/06/2021 23:02:58 - INFO - __main__ - Step 13040: {'lr': 0.0004931678452176116, 'samples': 2503680, 'steps': 13039, 'loss/train': 1.5152404308319092} +11/06/2021 23:02:59 - INFO - __main__ - Step 13041: {'lr': 0.0004931666130105563, 'samples': 2503872, 'steps': 13040, 'loss/train': 1.6495338678359985} +11/06/2021 23:03:00 - INFO - __main__ - Step 13042: {'lr': 0.0004931653806939341, 'samples': 2504064, 'steps': 13041, 'loss/train': 1.6312777996063232} +11/06/2021 23:03:00 - INFO - __main__ - Step 13043: {'lr': 0.0004931641482677452, 'samples': 2504256, 'steps': 13042, 'loss/train': 1.6087427139282227} +11/06/2021 23:03:01 - INFO - __main__ - Step 13044: {'lr': 0.0004931629157319904, 'samples': 2504448, 'steps': 13043, 'loss/train': 1.2086093425750732} +11/06/2021 23:03:01 - INFO - __main__ - Step 13045: {'lr': 0.00049316168308667, 'samples': 2504640, 'steps': 13044, 'loss/train': 0.33910736441612244} +11/06/2021 23:03:02 - INFO - __main__ - Step 13046: {'lr': 0.0004931604503317846, 'samples': 2504832, 'steps': 13045, 'loss/train': 1.6171785593032837} +11/06/2021 23:03:02 - INFO - __main__ - Step 13047: {'lr': 0.0004931592174673351, 'samples': 2505024, 'steps': 13046, 'loss/train': 1.6778055429458618} +11/06/2021 23:03:03 - INFO - __main__ - Step 13048: {'lr': 0.0004931579844933218, 'samples': 2505216, 'steps': 13047, 'loss/train': 1.8838071823120117} +11/06/2021 23:03:03 - INFO - __main__ - Step 13049: {'lr': 0.0004931567514097451, 'samples': 2505408, 'steps': 13048, 'loss/train': 1.89003586769104} +11/06/2021 23:03:03 - INFO - __main__ - Step 13050: {'lr': 0.0004931555182166059, 'samples': 2505600, 'steps': 13049, 'loss/train': 1.5584383010864258} +11/06/2021 23:03:04 - INFO - __main__ - Step 13051: {'lr': 0.0004931542849139044, 'samples': 2505792, 'steps': 13050, 'loss/train': 2.8212499618530273} +11/06/2021 23:03:05 - INFO - __main__ - Step 13052: {'lr': 0.0004931530515016415, 'samples': 2505984, 'steps': 13051, 'loss/train': 1.6236906051635742} +11/06/2021 23:03:05 - INFO - __main__ - Step 13053: {'lr': 0.0004931518179798175, 'samples': 2506176, 'steps': 13052, 'loss/train': 1.8090659379959106} +11/06/2021 23:03:05 - INFO - __main__ - Step 13054: {'lr': 0.000493150584348433, 'samples': 2506368, 'steps': 13053, 'loss/train': 1.5024513006210327} +11/06/2021 23:03:06 - INFO - __main__ - Step 13055: {'lr': 0.0004931493506074886, 'samples': 2506560, 'steps': 13054, 'loss/train': 1.271149754524231} +11/06/2021 23:03:07 - INFO - __main__ - Step 13056: {'lr': 0.0004931481167569849, 'samples': 2506752, 'steps': 13055, 'loss/train': 1.1166818141937256} +11/06/2021 23:03:07 - INFO - __main__ - Step 13057: {'lr': 0.0004931468827969223, 'samples': 2506944, 'steps': 13056, 'loss/train': 1.8440206050872803} +11/06/2021 23:03:08 - INFO - __main__ - Step 13058: {'lr': 0.0004931456487273017, 'samples': 2507136, 'steps': 13057, 'loss/train': 1.7418556213378906} +11/06/2021 23:03:08 - INFO - __main__ - Step 13059: {'lr': 0.0004931444145481233, 'samples': 2507328, 'steps': 13058, 'loss/train': 1.3444815874099731} +11/06/2021 23:03:08 - INFO - __main__ - Step 13060: {'lr': 0.0004931431802593877, 'samples': 2507520, 'steps': 13059, 'loss/train': 2.082310438156128} +11/06/2021 23:03:09 - INFO - __main__ - Step 13061: {'lr': 0.0004931419458610956, 'samples': 2507712, 'steps': 13060, 'loss/train': 0.22066687047481537} +11/06/2021 23:03:10 - INFO - __main__ - Step 13062: {'lr': 0.0004931407113532476, 'samples': 2507904, 'steps': 13061, 'loss/train': 1.8766014575958252} +11/06/2021 23:03:10 - INFO - __main__ - Step 13063: {'lr': 0.000493139476735844, 'samples': 2508096, 'steps': 13062, 'loss/train': 2.6808207035064697} +11/06/2021 23:03:10 - INFO - __main__ - Step 13064: {'lr': 0.0004931382420088855, 'samples': 2508288, 'steps': 13063, 'loss/train': 1.8290174007415771} +11/06/2021 23:03:11 - INFO - __main__ - Step 13065: {'lr': 0.0004931370071723728, 'samples': 2508480, 'steps': 13064, 'loss/train': 1.6822478771209717} +11/06/2021 23:03:11 - INFO - __main__ - Step 13066: {'lr': 0.0004931357722263061, 'samples': 2508672, 'steps': 13065, 'loss/train': 1.7262883186340332} +11/06/2021 23:03:12 - INFO - __main__ - Step 13067: {'lr': 0.0004931345371706863, 'samples': 2508864, 'steps': 13066, 'loss/train': 1.8077123165130615} +11/06/2021 23:03:13 - INFO - __main__ - Step 13068: {'lr': 0.0004931333020055139, 'samples': 2509056, 'steps': 13067, 'loss/train': 1.600835919380188} +11/06/2021 23:03:13 - INFO - __main__ - Step 13069: {'lr': 0.0004931320667307893, 'samples': 2509248, 'steps': 13068, 'loss/train': 2.081484794616699} +11/06/2021 23:03:13 - INFO - __main__ - Step 13070: {'lr': 0.0004931308313465132, 'samples': 2509440, 'steps': 13069, 'loss/train': 1.9141942262649536} +11/06/2021 23:03:14 - INFO - __main__ - Step 13071: {'lr': 0.000493129595852686, 'samples': 2509632, 'steps': 13070, 'loss/train': 3.5768423080444336} +11/06/2021 23:03:15 - INFO - __main__ - Step 13072: {'lr': 0.0004931283602493084, 'samples': 2509824, 'steps': 13071, 'loss/train': 1.5225051641464233} +11/06/2021 23:03:15 - INFO - __main__ - Step 13073: {'lr': 0.0004931271245363809, 'samples': 2510016, 'steps': 13072, 'loss/train': 1.574705958366394} +11/06/2021 23:03:15 - INFO - __main__ - Step 13074: {'lr': 0.0004931258887139041, 'samples': 2510208, 'steps': 13073, 'loss/train': 1.5260777473449707} +11/06/2021 23:03:16 - INFO - __main__ - Step 13075: {'lr': 0.0004931246527818785, 'samples': 2510400, 'steps': 13074, 'loss/train': 1.26536226272583} +11/06/2021 23:03:16 - INFO - __main__ - Step 13076: {'lr': 0.0004931234167403047, 'samples': 2510592, 'steps': 13075, 'loss/train': 1.4206626415252686} +11/06/2021 23:03:17 - INFO - __main__ - Step 13077: {'lr': 0.0004931221805891833, 'samples': 2510784, 'steps': 13076, 'loss/train': 1.6260327100753784} +11/06/2021 23:03:17 - INFO - __main__ - Step 13078: {'lr': 0.0004931209443285147, 'samples': 2510976, 'steps': 13077, 'loss/train': 1.759495735168457} +11/06/2021 23:03:18 - INFO - __main__ - Step 13079: {'lr': 0.0004931197079582996, 'samples': 2511168, 'steps': 13078, 'loss/train': 1.1801636219024658} +11/06/2021 23:03:18 - INFO - __main__ - Step 13080: {'lr': 0.0004931184714785385, 'samples': 2511360, 'steps': 13079, 'loss/train': 1.9777021408081055} +11/06/2021 23:03:18 - INFO - __main__ - Step 13081: {'lr': 0.000493117234889232, 'samples': 2511552, 'steps': 13080, 'loss/train': 1.551526665687561} +11/06/2021 23:03:20 - INFO - __main__ - Step 13082: {'lr': 0.0004931159981903805, 'samples': 2511744, 'steps': 13081, 'loss/train': 1.3697116374969482} +11/06/2021 23:03:20 - INFO - __main__ - Step 13083: {'lr': 0.0004931147613819848, 'samples': 2511936, 'steps': 13082, 'loss/train': 1.5000561475753784} +11/06/2021 23:03:20 - INFO - __main__ - Step 13084: {'lr': 0.0004931135244640453, 'samples': 2512128, 'steps': 13083, 'loss/train': 1.6628344058990479} +11/06/2021 23:03:21 - INFO - __main__ - Step 13085: {'lr': 0.0004931122874365627, 'samples': 2512320, 'steps': 13084, 'loss/train': 1.448068618774414} +11/06/2021 23:03:21 - INFO - __main__ - Step 13086: {'lr': 0.0004931110502995374, 'samples': 2512512, 'steps': 13085, 'loss/train': 1.518585443496704} +11/06/2021 23:03:22 - INFO - __main__ - Step 13087: {'lr': 0.0004931098130529699, 'samples': 2512704, 'steps': 13086, 'loss/train': 2.025705099105835} +11/06/2021 23:03:22 - INFO - __main__ - Step 13088: {'lr': 0.000493108575696861, 'samples': 2512896, 'steps': 13087, 'loss/train': 1.6481513977050781} +11/06/2021 23:03:23 - INFO - __main__ - Step 13089: {'lr': 0.0004931073382312111, 'samples': 2513088, 'steps': 13088, 'loss/train': 1.394457221031189} +11/06/2021 23:03:23 - INFO - __main__ - Step 13090: {'lr': 0.0004931061006560207, 'samples': 2513280, 'steps': 13089, 'loss/train': 1.560387134552002} +11/06/2021 23:03:23 - INFO - __main__ - Step 13091: {'lr': 0.0004931048629712905, 'samples': 2513472, 'steps': 13090, 'loss/train': 1.8698866367340088} +11/06/2021 23:03:24 - INFO - __main__ - Step 13092: {'lr': 0.000493103625177021, 'samples': 2513664, 'steps': 13091, 'loss/train': 2.115483522415161} +11/06/2021 23:03:25 - INFO - __main__ - Step 13093: {'lr': 0.0004931023872732128, 'samples': 2513856, 'steps': 13092, 'loss/train': 1.7177084684371948} +11/06/2021 23:03:25 - INFO - __main__ - Step 13094: {'lr': 0.0004931011492598664, 'samples': 2514048, 'steps': 13093, 'loss/train': 0.9922665953636169} +11/06/2021 23:03:25 - INFO - __main__ - Step 13095: {'lr': 0.0004930999111369824, 'samples': 2514240, 'steps': 13094, 'loss/train': 1.6571738719940186} +11/06/2021 23:03:26 - INFO - __main__ - Step 13096: {'lr': 0.0004930986729045613, 'samples': 2514432, 'steps': 13095, 'loss/train': 1.8621472120285034} +11/06/2021 23:03:26 - INFO - __main__ - Step 13097: {'lr': 0.0004930974345626036, 'samples': 2514624, 'steps': 13096, 'loss/train': 1.177014708518982} +11/06/2021 23:03:27 - INFO - __main__ - Step 13098: {'lr': 0.00049309619611111, 'samples': 2514816, 'steps': 13097, 'loss/train': 1.6075189113616943} +11/06/2021 23:03:28 - INFO - __main__ - Step 13099: {'lr': 0.000493094957550081, 'samples': 2515008, 'steps': 13098, 'loss/train': 1.3369756937026978} +11/06/2021 23:03:28 - INFO - __main__ - Step 13100: {'lr': 0.0004930937188795172, 'samples': 2515200, 'steps': 13099, 'loss/train': 1.7597624063491821} +11/06/2021 23:03:28 - INFO - __main__ - Step 13101: {'lr': 0.0004930924800994192, 'samples': 2515392, 'steps': 13100, 'loss/train': 1.1955498456954956} +11/06/2021 23:03:29 - INFO - __main__ - Step 13102: {'lr': 0.0004930912412097874, 'samples': 2515584, 'steps': 13101, 'loss/train': 2.0432753562927246} +11/06/2021 23:03:30 - INFO - __main__ - Step 13103: {'lr': 0.0004930900022106224, 'samples': 2515776, 'steps': 13102, 'loss/train': 1.897919774055481} +11/06/2021 23:03:30 - INFO - __main__ - Step 13104: {'lr': 0.0004930887631019248, 'samples': 2515968, 'steps': 13103, 'loss/train': 1.3024754524230957} +11/06/2021 23:03:30 - INFO - __main__ - Step 13105: {'lr': 0.0004930875238836951, 'samples': 2516160, 'steps': 13104, 'loss/train': 1.7677634954452515} +11/06/2021 23:03:31 - INFO - __main__ - Step 13106: {'lr': 0.000493086284555934, 'samples': 2516352, 'steps': 13105, 'loss/train': 2.061279773712158} +11/06/2021 23:03:31 - INFO - __main__ - Step 13107: {'lr': 0.0004930850451186421, 'samples': 2516544, 'steps': 13106, 'loss/train': 1.8709264993667603} +11/06/2021 23:03:32 - INFO - __main__ - Step 13108: {'lr': 0.0004930838055718196, 'samples': 2516736, 'steps': 13107, 'loss/train': 1.6638407707214355} +11/06/2021 23:03:32 - INFO - __main__ - Step 13109: {'lr': 0.0004930825659154674, 'samples': 2516928, 'steps': 13108, 'loss/train': 0.959062397480011} +11/06/2021 23:03:33 - INFO - __main__ - Step 13110: {'lr': 0.000493081326149586, 'samples': 2517120, 'steps': 13109, 'loss/train': 1.8210927248001099} +11/06/2021 23:03:33 - INFO - __main__ - Step 13111: {'lr': 0.0004930800862741758, 'samples': 2517312, 'steps': 13110, 'loss/train': 1.239546775817871} +11/06/2021 23:03:33 - INFO - __main__ - Step 13112: {'lr': 0.0004930788462892375, 'samples': 2517504, 'steps': 13111, 'loss/train': 1.4559482336044312} +11/06/2021 23:03:34 - INFO - __main__ - Step 13113: {'lr': 0.0004930776061947716, 'samples': 2517696, 'steps': 13112, 'loss/train': 1.6347291469573975} +11/06/2021 23:03:35 - INFO - __main__ - Step 13114: {'lr': 0.0004930763659907788, 'samples': 2517888, 'steps': 13113, 'loss/train': 1.7659398317337036} +11/06/2021 23:03:35 - INFO - __main__ - Step 13115: {'lr': 0.0004930751256772593, 'samples': 2518080, 'steps': 13114, 'loss/train': 1.8895224332809448} +11/06/2021 23:03:35 - INFO - __main__ - Step 13116: {'lr': 0.0004930738852542141, 'samples': 2518272, 'steps': 13115, 'loss/train': 1.4143397808074951} +11/06/2021 23:03:36 - INFO - __main__ - Step 13117: {'lr': 0.0004930726447216435, 'samples': 2518464, 'steps': 13116, 'loss/train': 2.018646240234375} +11/06/2021 23:03:37 - INFO - __main__ - Step 13118: {'lr': 0.0004930714040795481, 'samples': 2518656, 'steps': 13117, 'loss/train': 1.5822020769119263} +11/06/2021 23:03:37 - INFO - __main__ - Step 13119: {'lr': 0.0004930701633279285, 'samples': 2518848, 'steps': 13118, 'loss/train': 1.5482772588729858} +11/06/2021 23:03:38 - INFO - __main__ - Step 13120: {'lr': 0.0004930689224667853, 'samples': 2519040, 'steps': 13119, 'loss/train': 1.1191784143447876} +11/06/2021 23:03:38 - INFO - __main__ - Step 13121: {'lr': 0.0004930676814961189, 'samples': 2519232, 'steps': 13120, 'loss/train': 1.5763609409332275} +11/06/2021 23:03:38 - INFO - __main__ - Step 13122: {'lr': 0.00049306644041593, 'samples': 2519424, 'steps': 13121, 'loss/train': 1.3790456056594849} +11/06/2021 23:03:40 - INFO - __main__ - Step 13123: {'lr': 0.0004930651992262191, 'samples': 2519616, 'steps': 13122, 'loss/train': 1.3503462076187134} +11/06/2021 23:03:40 - INFO - __main__ - Step 13124: {'lr': 0.0004930639579269866, 'samples': 2519808, 'steps': 13123, 'loss/train': 1.4450675249099731} +11/06/2021 23:03:41 - INFO - __main__ - Step 13125: {'lr': 0.0004930627165182335, 'samples': 2520000, 'steps': 13124, 'loss/train': 1.5567551851272583} +11/06/2021 23:03:41 - INFO - __main__ - Step 13126: {'lr': 0.00049306147499996, 'samples': 2520192, 'steps': 13125, 'loss/train': 1.7951613664627075} +11/06/2021 23:03:42 - INFO - __main__ - Step 13127: {'lr': 0.0004930602333721667, 'samples': 2520384, 'steps': 13126, 'loss/train': 1.6020070314407349} +11/06/2021 23:03:42 - INFO - __main__ - Step 13128: {'lr': 0.0004930589916348542, 'samples': 2520576, 'steps': 13127, 'loss/train': 1.8576689958572388} +11/06/2021 23:03:42 - INFO - __main__ - Step 13129: {'lr': 0.0004930577497880231, 'samples': 2520768, 'steps': 13128, 'loss/train': 1.8128331899642944} +11/06/2021 23:03:43 - INFO - __main__ - Step 13130: {'lr': 0.000493056507831674, 'samples': 2520960, 'steps': 13129, 'loss/train': 1.8191680908203125} +11/06/2021 23:03:44 - INFO - __main__ - Step 13131: {'lr': 0.0004930552657658073, 'samples': 2521152, 'steps': 13130, 'loss/train': 1.0424447059631348} +11/06/2021 23:03:44 - INFO - __main__ - Step 13132: {'lr': 0.0004930540235904237, 'samples': 2521344, 'steps': 13131, 'loss/train': 0.9502253532409668} +11/06/2021 23:03:44 - INFO - __main__ - Step 13133: {'lr': 0.0004930527813055237, 'samples': 2521536, 'steps': 13132, 'loss/train': 2.1043529510498047} +11/06/2021 23:03:45 - INFO - __main__ - Step 13134: {'lr': 0.0004930515389111078, 'samples': 2521728, 'steps': 13133, 'loss/train': 1.6203279495239258} +11/06/2021 23:03:46 - INFO - __main__ - Step 13135: {'lr': 0.0004930502964071767, 'samples': 2521920, 'steps': 13134, 'loss/train': 1.872376561164856} +11/06/2021 23:03:46 - INFO - __main__ - Step 13136: {'lr': 0.0004930490537937309, 'samples': 2522112, 'steps': 13135, 'loss/train': 1.530863881111145} +11/06/2021 23:03:46 - INFO - __main__ - Step 13137: {'lr': 0.0004930478110707709, 'samples': 2522304, 'steps': 13136, 'loss/train': 1.446254014968872} +11/06/2021 23:03:47 - INFO - __main__ - Step 13138: {'lr': 0.0004930465682382973, 'samples': 2522496, 'steps': 13137, 'loss/train': 2.3736038208007812} +11/06/2021 23:03:47 - INFO - __main__ - Step 13139: {'lr': 0.0004930453252963107, 'samples': 2522688, 'steps': 13138, 'loss/train': 1.7954354286193848} +11/06/2021 23:03:48 - INFO - __main__ - Step 13140: {'lr': 0.0004930440822448115, 'samples': 2522880, 'steps': 13139, 'loss/train': 1.4115676879882812} +11/06/2021 23:03:48 - INFO - __main__ - Step 13141: {'lr': 0.0004930428390838006, 'samples': 2523072, 'steps': 13140, 'loss/train': 1.7960898876190186} +11/06/2021 23:03:49 - INFO - __main__ - Step 13142: {'lr': 0.0004930415958132782, 'samples': 2523264, 'steps': 13141, 'loss/train': 1.5703538656234741} +11/06/2021 23:03:49 - INFO - __main__ - Step 13143: {'lr': 0.0004930403524332451, 'samples': 2523456, 'steps': 13142, 'loss/train': 1.3508336544036865} +11/06/2021 23:03:50 - INFO - __main__ - Step 13144: {'lr': 0.0004930391089437017, 'samples': 2523648, 'steps': 13143, 'loss/train': 1.7475541830062866} +11/06/2021 23:03:51 - INFO - __main__ - Step 13145: {'lr': 0.0004930378653446487, 'samples': 2523840, 'steps': 13144, 'loss/train': 1.8159362077713013} +11/06/2021 23:03:51 - INFO - __main__ - Step 13146: {'lr': 0.0004930366216360865, 'samples': 2524032, 'steps': 13145, 'loss/train': 1.6725317239761353} +11/06/2021 23:03:51 - INFO - __main__ - Step 13147: {'lr': 0.0004930353778180158, 'samples': 2524224, 'steps': 13146, 'loss/train': 1.5883946418762207} +11/06/2021 23:03:52 - INFO - __main__ - Step 13148: {'lr': 0.0004930341338904371, 'samples': 2524416, 'steps': 13147, 'loss/train': 1.889960765838623} +11/06/2021 23:03:52 - INFO - __main__ - Step 13149: {'lr': 0.000493032889853351, 'samples': 2524608, 'steps': 13148, 'loss/train': 1.9227193593978882} +11/06/2021 23:03:53 - INFO - __main__ - Step 13150: {'lr': 0.0004930316457067579, 'samples': 2524800, 'steps': 13149, 'loss/train': 1.51223886013031} +11/06/2021 23:03:53 - INFO - __main__ - Step 13151: {'lr': 0.0004930304014506586, 'samples': 2524992, 'steps': 13150, 'loss/train': 1.603259801864624} +11/06/2021 23:03:54 - INFO - __main__ - Step 13152: {'lr': 0.0004930291570850536, 'samples': 2525184, 'steps': 13151, 'loss/train': 1.576635479927063} +11/06/2021 23:03:54 - INFO - __main__ - Step 13153: {'lr': 0.0004930279126099433, 'samples': 2525376, 'steps': 13152, 'loss/train': 1.0832215547561646} +11/06/2021 23:03:54 - INFO - __main__ - Step 13154: {'lr': 0.0004930266680253284, 'samples': 2525568, 'steps': 13153, 'loss/train': 1.7394440174102783} +11/06/2021 23:03:55 - INFO - __main__ - Step 13155: {'lr': 0.0004930254233312095, 'samples': 2525760, 'steps': 13154, 'loss/train': 1.2529510259628296} +11/06/2021 23:03:56 - INFO - __main__ - Step 13156: {'lr': 0.000493024178527587, 'samples': 2525952, 'steps': 13155, 'loss/train': 2.2869997024536133} +11/06/2021 23:03:56 - INFO - __main__ - Step 13157: {'lr': 0.0004930229336144616, 'samples': 2526144, 'steps': 13156, 'loss/train': 1.7819799184799194} +11/06/2021 23:03:56 - INFO - __main__ - Step 13158: {'lr': 0.0004930216885918339, 'samples': 2526336, 'steps': 13157, 'loss/train': 1.7473498582839966} +11/06/2021 23:03:57 - INFO - __main__ - Step 13159: {'lr': 0.0004930204434597042, 'samples': 2526528, 'steps': 13158, 'loss/train': 1.48399019241333} +11/06/2021 23:03:57 - INFO - __main__ - Step 13160: {'lr': 0.0004930191982180734, 'samples': 2526720, 'steps': 13159, 'loss/train': 1.5737640857696533} +11/06/2021 23:03:58 - INFO - __main__ - Step 13161: {'lr': 0.0004930179528669418, 'samples': 2526912, 'steps': 13160, 'loss/train': 2.018446683883667} +11/06/2021 23:03:59 - INFO - __main__ - Step 13162: {'lr': 0.0004930167074063101, 'samples': 2527104, 'steps': 13161, 'loss/train': 1.7737540006637573} +11/06/2021 23:03:59 - INFO - __main__ - Step 13163: {'lr': 0.0004930154618361789, 'samples': 2527296, 'steps': 13162, 'loss/train': 1.867935299873352} +11/06/2021 23:03:59 - INFO - __main__ - Step 13164: {'lr': 0.0004930142161565486, 'samples': 2527488, 'steps': 13163, 'loss/train': 2.0381977558135986} +11/06/2021 23:04:00 - INFO - __main__ - Step 13165: {'lr': 0.0004930129703674198, 'samples': 2527680, 'steps': 13164, 'loss/train': 1.8840910196304321} +11/06/2021 23:04:01 - INFO - __main__ - Step 13166: {'lr': 0.0004930117244687931, 'samples': 2527872, 'steps': 13165, 'loss/train': 1.4074156284332275} +11/06/2021 23:04:01 - INFO - __main__ - Step 13167: {'lr': 0.0004930104784606692, 'samples': 2528064, 'steps': 13166, 'loss/train': 2.063450813293457} +11/06/2021 23:04:01 - INFO - __main__ - Step 13168: {'lr': 0.0004930092323430484, 'samples': 2528256, 'steps': 13167, 'loss/train': 2.0765469074249268} +11/06/2021 23:04:02 - INFO - __main__ - Step 13169: {'lr': 0.0004930079861159315, 'samples': 2528448, 'steps': 13168, 'loss/train': 1.3868030309677124} +11/06/2021 23:04:02 - INFO - __main__ - Step 13170: {'lr': 0.0004930067397793188, 'samples': 2528640, 'steps': 13169, 'loss/train': 1.732783317565918} +11/06/2021 23:04:03 - INFO - __main__ - Step 13171: {'lr': 0.0004930054933332111, 'samples': 2528832, 'steps': 13170, 'loss/train': 1.683578610420227} +11/06/2021 23:04:03 - INFO - __main__ - Step 13172: {'lr': 0.0004930042467776089, 'samples': 2529024, 'steps': 13171, 'loss/train': 1.720359206199646} +11/06/2021 23:04:04 - INFO - __main__ - Step 13173: {'lr': 0.0004930030001125128, 'samples': 2529216, 'steps': 13172, 'loss/train': 1.2218900918960571} +11/06/2021 23:04:04 - INFO - __main__ - Step 13174: {'lr': 0.000493001753337923, 'samples': 2529408, 'steps': 13173, 'loss/train': 1.542048692703247} +11/06/2021 23:04:04 - INFO - __main__ - Step 13175: {'lr': 0.0004930005064538406, 'samples': 2529600, 'steps': 13174, 'loss/train': 1.7872868776321411} +11/06/2021 23:04:05 - INFO - __main__ - Step 13176: {'lr': 0.0004929992594602659, 'samples': 2529792, 'steps': 13175, 'loss/train': 1.104972243309021} +11/06/2021 23:04:06 - INFO - __main__ - Step 13177: {'lr': 0.0004929980123571995, 'samples': 2529984, 'steps': 13176, 'loss/train': 1.122475504875183} +11/06/2021 23:04:06 - INFO - __main__ - Step 13178: {'lr': 0.000492996765144642, 'samples': 2530176, 'steps': 13177, 'loss/train': 1.7249083518981934} +11/06/2021 23:04:07 - INFO - __main__ - Step 13179: {'lr': 0.0004929955178225938, 'samples': 2530368, 'steps': 13178, 'loss/train': 1.1565667390823364} +11/06/2021 23:04:07 - INFO - __main__ - Step 13180: {'lr': 0.0004929942703910556, 'samples': 2530560, 'steps': 13179, 'loss/train': 2.3176705837249756} +11/06/2021 23:04:07 - INFO - __main__ - Step 13181: {'lr': 0.0004929930228500279, 'samples': 2530752, 'steps': 13180, 'loss/train': 1.5887360572814941} +11/06/2021 23:04:09 - INFO - __main__ - Step 13182: {'lr': 0.0004929917751995114, 'samples': 2530944, 'steps': 13181, 'loss/train': 1.8893414735794067} +11/06/2021 23:04:09 - INFO - __main__ - Step 13183: {'lr': 0.0004929905274395064, 'samples': 2531136, 'steps': 13182, 'loss/train': 1.7040241956710815} +11/06/2021 23:04:09 - INFO - __main__ - Step 13184: {'lr': 0.0004929892795700137, 'samples': 2531328, 'steps': 13183, 'loss/train': 1.8834102153778076} +11/06/2021 23:04:10 - INFO - __main__ - Step 13185: {'lr': 0.0004929880315910338, 'samples': 2531520, 'steps': 13184, 'loss/train': 0.39340120553970337} +11/06/2021 23:04:10 - INFO - __main__ - Step 13186: {'lr': 0.0004929867835025672, 'samples': 2531712, 'steps': 13185, 'loss/train': 0.29085573554039} +11/06/2021 23:04:10 - INFO - __main__ - Step 13187: {'lr': 0.0004929855353046145, 'samples': 2531904, 'steps': 13186, 'loss/train': 1.7704241275787354} +11/06/2021 23:04:11 - INFO - __main__ - Step 13188: {'lr': 0.0004929842869971763, 'samples': 2532096, 'steps': 13187, 'loss/train': 1.63791024684906} +11/06/2021 23:04:12 - INFO - __main__ - Step 13189: {'lr': 0.000492983038580253, 'samples': 2532288, 'steps': 13188, 'loss/train': 0.9975517392158508} +11/06/2021 23:04:12 - INFO - __main__ - Step 13190: {'lr': 0.0004929817900538455, 'samples': 2532480, 'steps': 13189, 'loss/train': 1.4178115129470825} +11/06/2021 23:04:12 - INFO - __main__ - Step 13191: {'lr': 0.000492980541417954, 'samples': 2532672, 'steps': 13190, 'loss/train': 1.3342525959014893} +11/06/2021 23:04:13 - INFO - __main__ - Step 13192: {'lr': 0.0004929792926725794, 'samples': 2532864, 'steps': 13191, 'loss/train': 1.589043140411377} +11/06/2021 23:04:14 - INFO - __main__ - Step 13193: {'lr': 0.000492978043817722, 'samples': 2533056, 'steps': 13192, 'loss/train': 1.7581723928451538} +11/06/2021 23:04:14 - INFO - __main__ - Step 13194: {'lr': 0.0004929767948533823, 'samples': 2533248, 'steps': 13193, 'loss/train': 1.6882779598236084} +11/06/2021 23:04:15 - INFO - __main__ - Step 13195: {'lr': 0.0004929755457795612, 'samples': 2533440, 'steps': 13194, 'loss/train': 1.444657802581787} +11/06/2021 23:04:15 - INFO - __main__ - Step 13196: {'lr': 0.0004929742965962589, 'samples': 2533632, 'steps': 13195, 'loss/train': 1.9157907962799072} +11/06/2021 23:04:15 - INFO - __main__ - Step 13197: {'lr': 0.0004929730473034763, 'samples': 2533824, 'steps': 13196, 'loss/train': 1.561155915260315} +11/06/2021 23:04:16 - INFO - __main__ - Step 13198: {'lr': 0.0004929717979012136, 'samples': 2534016, 'steps': 13197, 'loss/train': 1.3841657638549805} +11/06/2021 23:04:17 - INFO - __main__ - Step 13199: {'lr': 0.0004929705483894717, 'samples': 2534208, 'steps': 13198, 'loss/train': 1.5719326734542847} +11/06/2021 23:04:17 - INFO - __main__ - Step 13200: {'lr': 0.000492969298768251, 'samples': 2534400, 'steps': 13199, 'loss/train': 1.4586410522460938} +11/06/2021 23:04:17 - INFO - __main__ - Step 13201: {'lr': 0.000492968049037552, 'samples': 2534592, 'steps': 13200, 'loss/train': 1.2632533311843872} +11/06/2021 23:04:18 - INFO - __main__ - Step 13202: {'lr': 0.0004929667991973754, 'samples': 2534784, 'steps': 13201, 'loss/train': 1.835030436515808} +11/06/2021 23:04:19 - INFO - __main__ - Step 13203: {'lr': 0.0004929655492477218, 'samples': 2534976, 'steps': 13202, 'loss/train': 2.025620937347412} +11/06/2021 23:04:19 - INFO - __main__ - Step 13204: {'lr': 0.0004929642991885916, 'samples': 2535168, 'steps': 13203, 'loss/train': 1.8089247941970825} +11/06/2021 23:04:20 - INFO - __main__ - Step 13205: {'lr': 0.0004929630490199854, 'samples': 2535360, 'steps': 13204, 'loss/train': 1.419128656387329} +11/06/2021 23:04:20 - INFO - __main__ - Step 13206: {'lr': 0.0004929617987419039, 'samples': 2535552, 'steps': 13205, 'loss/train': 1.9509419202804565} +11/06/2021 23:04:20 - INFO - __main__ - Step 13207: {'lr': 0.0004929605483543474, 'samples': 2535744, 'steps': 13206, 'loss/train': 1.7414957284927368} +11/06/2021 23:04:21 - INFO - __main__ - Step 13208: {'lr': 0.0004929592978573168, 'samples': 2535936, 'steps': 13207, 'loss/train': 1.3497000932693481} +11/06/2021 23:04:22 - INFO - __main__ - Step 13209: {'lr': 0.0004929580472508124, 'samples': 2536128, 'steps': 13208, 'loss/train': 1.4849274158477783} +11/06/2021 23:04:22 - INFO - __main__ - Step 13210: {'lr': 0.0004929567965348347, 'samples': 2536320, 'steps': 13209, 'loss/train': 1.7661024332046509} +11/06/2021 23:04:22 - INFO - __main__ - Step 13211: {'lr': 0.0004929555457093847, 'samples': 2536512, 'steps': 13210, 'loss/train': 1.7493226528167725} +11/06/2021 23:04:23 - INFO - __main__ - Step 13212: {'lr': 0.0004929542947744625, 'samples': 2536704, 'steps': 13211, 'loss/train': 1.1652683019638062} +11/06/2021 23:04:23 - INFO - __main__ - Step 13213: {'lr': 0.0004929530437300689, 'samples': 2536896, 'steps': 13212, 'loss/train': 1.901105284690857} +11/06/2021 23:04:24 - INFO - __main__ - Step 13214: {'lr': 0.0004929517925762045, 'samples': 2537088, 'steps': 13213, 'loss/train': 1.7152559757232666} +11/06/2021 23:04:24 - INFO - __main__ - Step 13215: {'lr': 0.0004929505413128696, 'samples': 2537280, 'steps': 13214, 'loss/train': 1.5080220699310303} +11/06/2021 23:04:25 - INFO - __main__ - Step 13216: {'lr': 0.000492949289940065, 'samples': 2537472, 'steps': 13215, 'loss/train': 1.7063556909561157} +11/06/2021 23:04:25 - INFO - __main__ - Step 13217: {'lr': 0.0004929480384577912, 'samples': 2537664, 'steps': 13216, 'loss/train': 1.8721396923065186} +11/06/2021 23:04:25 - INFO - __main__ - Step 13218: {'lr': 0.0004929467868660487, 'samples': 2537856, 'steps': 13217, 'loss/train': 1.3065961599349976} +11/06/2021 23:04:27 - INFO - __main__ - Step 13219: {'lr': 0.0004929455351648383, 'samples': 2538048, 'steps': 13218, 'loss/train': 1.533849835395813} +11/06/2021 23:04:27 - INFO - __main__ - Step 13220: {'lr': 0.0004929442833541603, 'samples': 2538240, 'steps': 13219, 'loss/train': 1.7814805507659912} +11/06/2021 23:04:27 - INFO - __main__ - Step 13221: {'lr': 0.0004929430314340154, 'samples': 2538432, 'steps': 13220, 'loss/train': 1.5206717252731323} +11/06/2021 23:04:28 - INFO - __main__ - Step 13222: {'lr': 0.000492941779404404, 'samples': 2538624, 'steps': 13221, 'loss/train': 1.3217058181762695} +11/06/2021 23:04:28 - INFO - __main__ - Step 13223: {'lr': 0.0004929405272653269, 'samples': 2538816, 'steps': 13222, 'loss/train': 1.758650302886963} +11/06/2021 23:04:29 - INFO - __main__ - Step 13224: {'lr': 0.0004929392750167845, 'samples': 2539008, 'steps': 13223, 'loss/train': 0.7512359023094177} +11/06/2021 23:04:29 - INFO - __main__ - Step 13225: {'lr': 0.0004929380226587774, 'samples': 2539200, 'steps': 13224, 'loss/train': 1.9796491861343384} +11/06/2021 23:04:30 - INFO - __main__ - Step 13226: {'lr': 0.0004929367701913062, 'samples': 2539392, 'steps': 13225, 'loss/train': 0.7901928424835205} +11/06/2021 23:04:30 - INFO - __main__ - Step 13227: {'lr': 0.0004929355176143714, 'samples': 2539584, 'steps': 13226, 'loss/train': 1.6296266317367554} +11/06/2021 23:04:30 - INFO - __main__ - Step 13228: {'lr': 0.0004929342649279736, 'samples': 2539776, 'steps': 13227, 'loss/train': 2.2642016410827637} +11/06/2021 23:04:31 - INFO - __main__ - Step 13229: {'lr': 0.0004929330121321134, 'samples': 2539968, 'steps': 13228, 'loss/train': 1.9576764106750488} +11/06/2021 23:04:32 - INFO - __main__ - Step 13230: {'lr': 0.0004929317592267913, 'samples': 2540160, 'steps': 13229, 'loss/train': 1.3771681785583496} +11/06/2021 23:04:32 - INFO - __main__ - Step 13231: {'lr': 0.000492930506212008, 'samples': 2540352, 'steps': 13230, 'loss/train': 1.4580309391021729} +11/06/2021 23:04:32 - INFO - __main__ - Step 13232: {'lr': 0.0004929292530877638, 'samples': 2540544, 'steps': 13231, 'loss/train': 1.5122207403182983} +11/06/2021 23:04:33 - INFO - __main__ - Step 13233: {'lr': 0.0004929279998540596, 'samples': 2540736, 'steps': 13232, 'loss/train': 1.770660400390625} +11/06/2021 23:04:34 - INFO - __main__ - Step 13234: {'lr': 0.0004929267465108956, 'samples': 2540928, 'steps': 13233, 'loss/train': 0.6602691411972046} +11/06/2021 23:04:34 - INFO - __main__ - Step 13235: {'lr': 0.0004929254930582728, 'samples': 2541120, 'steps': 13234, 'loss/train': 1.746626853942871} +11/06/2021 23:04:35 - INFO - __main__ - Step 13236: {'lr': 0.0004929242394961914, 'samples': 2541312, 'steps': 13235, 'loss/train': 1.5053402185440063} +11/06/2021 23:04:35 - INFO - __main__ - Step 13237: {'lr': 0.000492922985824652, 'samples': 2541504, 'steps': 13236, 'loss/train': 1.3967210054397583} +11/06/2021 23:04:35 - INFO - __main__ - Step 13238: {'lr': 0.0004929217320436553, 'samples': 2541696, 'steps': 13237, 'loss/train': 1.8607147932052612} +11/06/2021 23:04:36 - INFO - __main__ - Step 13239: {'lr': 0.0004929204781532018, 'samples': 2541888, 'steps': 13238, 'loss/train': 1.915743112564087} +11/06/2021 23:04:37 - INFO - __main__ - Step 13240: {'lr': 0.0004929192241532921, 'samples': 2542080, 'steps': 13239, 'loss/train': 1.5825774669647217} +11/06/2021 23:04:37 - INFO - __main__ - Step 13241: {'lr': 0.0004929179700439269, 'samples': 2542272, 'steps': 13240, 'loss/train': 0.8731245994567871} +11/06/2021 23:04:37 - INFO - __main__ - Step 13242: {'lr': 0.0004929167158251065, 'samples': 2542464, 'steps': 13241, 'loss/train': 1.7549324035644531} +11/06/2021 23:04:38 - INFO - __main__ - Step 13243: {'lr': 0.0004929154614968315, 'samples': 2542656, 'steps': 13242, 'loss/train': 0.5492236614227295} +11/06/2021 23:04:39 - INFO - __main__ - Step 13244: {'lr': 0.0004929142070591026, 'samples': 2542848, 'steps': 13243, 'loss/train': 1.614729404449463} +11/06/2021 23:04:39 - INFO - __main__ - Step 13245: {'lr': 0.0004929129525119203, 'samples': 2543040, 'steps': 13244, 'loss/train': 1.537818193435669} +11/06/2021 23:04:40 - INFO - __main__ - Step 13246: {'lr': 0.0004929116978552851, 'samples': 2543232, 'steps': 13245, 'loss/train': 1.7951061725616455} +11/06/2021 23:04:40 - INFO - __main__ - Step 13247: {'lr': 0.0004929104430891978, 'samples': 2543424, 'steps': 13246, 'loss/train': 1.5061917304992676} +11/06/2021 23:04:40 - INFO - __main__ - Step 13248: {'lr': 0.0004929091882136587, 'samples': 2543616, 'steps': 13247, 'loss/train': 1.6849573850631714} +11/06/2021 23:04:41 - INFO - __main__ - Step 13249: {'lr': 0.0004929079332286685, 'samples': 2543808, 'steps': 13248, 'loss/train': 1.7223663330078125} +11/06/2021 23:04:42 - INFO - __main__ - Step 13250: {'lr': 0.0004929066781342277, 'samples': 2544000, 'steps': 13249, 'loss/train': 1.109410285949707} +11/06/2021 23:04:42 - INFO - __main__ - Step 13251: {'lr': 0.0004929054229303369, 'samples': 2544192, 'steps': 13250, 'loss/train': 1.5786045789718628} +11/06/2021 23:04:42 - INFO - __main__ - Step 13252: {'lr': 0.0004929041676169967, 'samples': 2544384, 'steps': 13251, 'loss/train': 1.4510022401809692} +11/06/2021 23:04:43 - INFO - __main__ - Step 13253: {'lr': 0.0004929029121942077, 'samples': 2544576, 'steps': 13252, 'loss/train': 1.5690830945968628} +11/06/2021 23:04:43 - INFO - __main__ - Step 13254: {'lr': 0.0004929016566619703, 'samples': 2544768, 'steps': 13253, 'loss/train': 1.475024938583374} +11/06/2021 23:04:44 - INFO - __main__ - Step 13255: {'lr': 0.0004929004010202851, 'samples': 2544960, 'steps': 13254, 'loss/train': 1.462422490119934} +11/06/2021 23:04:44 - INFO - __main__ - Step 13256: {'lr': 0.0004928991452691528, 'samples': 2545152, 'steps': 13255, 'loss/train': 1.8692861795425415} +11/06/2021 23:04:45 - INFO - __main__ - Step 13257: {'lr': 0.0004928978894085739, 'samples': 2545344, 'steps': 13256, 'loss/train': 1.8582710027694702} +11/06/2021 23:04:45 - INFO - __main__ - Step 13258: {'lr': 0.000492896633438549, 'samples': 2545536, 'steps': 13257, 'loss/train': 2.016894578933716} +11/06/2021 23:04:46 - INFO - __main__ - Step 13259: {'lr': 0.0004928953773590785, 'samples': 2545728, 'steps': 13258, 'loss/train': 1.6744557619094849} +11/06/2021 23:04:47 - INFO - __main__ - Step 13260: {'lr': 0.0004928941211701632, 'samples': 2545920, 'steps': 13259, 'loss/train': 0.2616555988788605} +11/06/2021 23:04:47 - INFO - __main__ - Step 13261: {'lr': 0.0004928928648718035, 'samples': 2546112, 'steps': 13260, 'loss/train': 1.6083446741104126} +11/06/2021 23:04:47 - INFO - __main__ - Step 13262: {'lr': 0.0004928916084640001, 'samples': 2546304, 'steps': 13261, 'loss/train': 1.1888530254364014} +11/06/2021 23:04:48 - INFO - __main__ - Step 13263: {'lr': 0.0004928903519467534, 'samples': 2546496, 'steps': 13262, 'loss/train': 2.4009814262390137} +11/06/2021 23:04:48 - INFO - __main__ - Step 13264: {'lr': 0.0004928890953200641, 'samples': 2546688, 'steps': 13263, 'loss/train': 1.301665186882019} +11/06/2021 23:04:49 - INFO - __main__ - Step 13265: {'lr': 0.0004928878385839327, 'samples': 2546880, 'steps': 13264, 'loss/train': 1.293091058731079} +11/06/2021 23:04:49 - INFO - __main__ - Step 13266: {'lr': 0.0004928865817383597, 'samples': 2547072, 'steps': 13265, 'loss/train': 1.251847267150879} +11/06/2021 23:04:50 - INFO - __main__ - Step 13267: {'lr': 0.0004928853247833459, 'samples': 2547264, 'steps': 13266, 'loss/train': 1.894822120666504} +11/06/2021 23:04:50 - INFO - __main__ - Step 13268: {'lr': 0.0004928840677188918, 'samples': 2547456, 'steps': 13267, 'loss/train': 1.5503804683685303} +11/06/2021 23:04:50 - INFO - __main__ - Step 13269: {'lr': 0.0004928828105449977, 'samples': 2547648, 'steps': 13268, 'loss/train': 1.885050892829895} +11/06/2021 23:04:52 - INFO - __main__ - Step 13270: {'lr': 0.0004928815532616644, 'samples': 2547840, 'steps': 13269, 'loss/train': 1.5068950653076172} +11/06/2021 23:04:52 - INFO - __main__ - Step 13271: {'lr': 0.0004928802958688924, 'samples': 2548032, 'steps': 13270, 'loss/train': 1.590198040008545} +11/06/2021 23:04:52 - INFO - __main__ - Step 13272: {'lr': 0.0004928790383666823, 'samples': 2548224, 'steps': 13271, 'loss/train': 1.786717176437378} +11/06/2021 23:04:53 - INFO - __main__ - Step 13273: {'lr': 0.0004928777807550348, 'samples': 2548416, 'steps': 13272, 'loss/train': 1.5326136350631714} +11/06/2021 23:04:53 - INFO - __main__ - Step 13274: {'lr': 0.0004928765230339502, 'samples': 2548608, 'steps': 13273, 'loss/train': 2.4051101207733154} +11/06/2021 23:04:54 - INFO - __main__ - Step 13275: {'lr': 0.000492875265203429, 'samples': 2548800, 'steps': 13274, 'loss/train': 2.304696559906006} +11/06/2021 23:04:54 - INFO - __main__ - Step 13276: {'lr': 0.0004928740072634722, 'samples': 2548992, 'steps': 13275, 'loss/train': 2.0685250759124756} +11/06/2021 23:04:55 - INFO - __main__ - Step 13277: {'lr': 0.0004928727492140801, 'samples': 2549184, 'steps': 13276, 'loss/train': 1.733903408050537} +11/06/2021 23:04:55 - INFO - __main__ - Step 13278: {'lr': 0.0004928714910552533, 'samples': 2549376, 'steps': 13277, 'loss/train': 1.8066354990005493} +11/06/2021 23:04:55 - INFO - __main__ - Step 13279: {'lr': 0.0004928702327869922, 'samples': 2549568, 'steps': 13278, 'loss/train': 1.9759420156478882} +11/06/2021 23:04:56 - INFO - __main__ - Step 13280: {'lr': 0.0004928689744092976, 'samples': 2549760, 'steps': 13279, 'loss/train': 1.8017091751098633} +11/06/2021 23:04:57 - INFO - __main__ - Step 13281: {'lr': 0.0004928677159221701, 'samples': 2549952, 'steps': 13280, 'loss/train': 1.4251042604446411} +11/06/2021 23:04:57 - INFO - __main__ - Step 13282: {'lr': 0.00049286645732561, 'samples': 2550144, 'steps': 13281, 'loss/train': 1.3295786380767822} +11/06/2021 23:04:57 - INFO - __main__ - Step 13283: {'lr': 0.0004928651986196181, 'samples': 2550336, 'steps': 13282, 'loss/train': 1.1968010663986206} +11/06/2021 23:04:58 - INFO - __main__ - Step 13284: {'lr': 0.0004928639398041948, 'samples': 2550528, 'steps': 13283, 'loss/train': 1.974739670753479} +11/06/2021 23:04:59 - INFO - __main__ - Step 13285: {'lr': 0.0004928626808793409, 'samples': 2550720, 'steps': 13284, 'loss/train': 1.5590357780456543} +11/06/2021 23:04:59 - INFO - __main__ - Step 13286: {'lr': 0.0004928614218450568, 'samples': 2550912, 'steps': 13285, 'loss/train': 1.4196864366531372} +11/06/2021 23:05:00 - INFO - __main__ - Step 13287: {'lr': 0.000492860162701343, 'samples': 2551104, 'steps': 13286, 'loss/train': 1.4201176166534424} +11/06/2021 23:05:00 - INFO - __main__ - Step 13288: {'lr': 0.0004928589034482001, 'samples': 2551296, 'steps': 13287, 'loss/train': 1.8625463247299194} +11/06/2021 23:05:00 - INFO - __main__ - Step 13289: {'lr': 0.000492857644085629, 'samples': 2551488, 'steps': 13288, 'loss/train': 1.8042540550231934} +11/06/2021 23:05:01 - INFO - __main__ - Step 13290: {'lr': 0.0004928563846136296, 'samples': 2551680, 'steps': 13289, 'loss/train': 1.6024283170700073} +11/06/2021 23:05:02 - INFO - __main__ - Step 13291: {'lr': 0.0004928551250322032, 'samples': 2551872, 'steps': 13290, 'loss/train': 1.5354256629943848} +11/06/2021 23:05:02 - INFO - __main__ - Step 13292: {'lr': 0.0004928538653413499, 'samples': 2552064, 'steps': 13291, 'loss/train': 2.1231536865234375} +11/06/2021 23:05:02 - INFO - __main__ - Step 13293: {'lr': 0.0004928526055410704, 'samples': 2552256, 'steps': 13292, 'loss/train': 1.7034943103790283} +11/06/2021 23:05:03 - INFO - __main__ - Step 13294: {'lr': 0.0004928513456313653, 'samples': 2552448, 'steps': 13293, 'loss/train': 1.6685292720794678} +11/06/2021 23:05:03 - INFO - __main__ - Step 13295: {'lr': 0.000492850085612235, 'samples': 2552640, 'steps': 13294, 'loss/train': 1.6578960418701172} +11/06/2021 23:05:04 - INFO - __main__ - Step 13296: {'lr': 0.0004928488254836804, 'samples': 2552832, 'steps': 13295, 'loss/train': 1.1260663270950317} +11/06/2021 23:05:04 - INFO - __main__ - Step 13297: {'lr': 0.0004928475652457017, 'samples': 2553024, 'steps': 13296, 'loss/train': 1.738349199295044} +11/06/2021 23:05:05 - INFO - __main__ - Step 13298: {'lr': 0.0004928463048982998, 'samples': 2553216, 'steps': 13297, 'loss/train': 1.6107333898544312} +11/06/2021 23:05:05 - INFO - __main__ - Step 13299: {'lr': 0.0004928450444414749, 'samples': 2553408, 'steps': 13298, 'loss/train': 2.0628111362457275} +11/06/2021 23:05:06 - INFO - __main__ - Step 13300: {'lr': 0.0004928437838752278, 'samples': 2553600, 'steps': 13299, 'loss/train': 1.5923441648483276} +11/06/2021 23:05:07 - INFO - __main__ - Step 13301: {'lr': 0.0004928425231995593, 'samples': 2553792, 'steps': 13300, 'loss/train': 1.7554380893707275} +11/06/2021 23:05:07 - INFO - __main__ - Step 13302: {'lr': 0.0004928412624144694, 'samples': 2553984, 'steps': 13301, 'loss/train': 1.8865063190460205} +11/06/2021 23:05:07 - INFO - __main__ - Step 13303: {'lr': 0.0004928400015199591, 'samples': 2554176, 'steps': 13302, 'loss/train': 1.7683358192443848} +11/06/2021 23:05:08 - INFO - __main__ - Step 13304: {'lr': 0.0004928387405160288, 'samples': 2554368, 'steps': 13303, 'loss/train': 1.6909922361373901} +11/06/2021 23:05:08 - INFO - __main__ - Step 13305: {'lr': 0.0004928374794026792, 'samples': 2554560, 'steps': 13304, 'loss/train': 1.3994184732437134} +11/06/2021 23:05:09 - INFO - __main__ - Step 13306: {'lr': 0.0004928362181799107, 'samples': 2554752, 'steps': 13305, 'loss/train': 1.705430030822754} +11/06/2021 23:05:09 - INFO - __main__ - Step 13307: {'lr': 0.0004928349568477239, 'samples': 2554944, 'steps': 13306, 'loss/train': 1.6792200803756714} +11/06/2021 23:05:10 - INFO - __main__ - Step 13308: {'lr': 0.0004928336954061195, 'samples': 2555136, 'steps': 13307, 'loss/train': 1.2497096061706543} +11/06/2021 23:05:10 - INFO - __main__ - Step 13309: {'lr': 0.000492832433855098, 'samples': 2555328, 'steps': 13308, 'loss/train': 1.3893240690231323} +11/06/2021 23:05:10 - INFO - __main__ - Step 13310: {'lr': 0.0004928311721946599, 'samples': 2555520, 'steps': 13309, 'loss/train': 1.5529297590255737} +11/06/2021 23:05:11 - INFO - __main__ - Step 13311: {'lr': 0.0004928299104248059, 'samples': 2555712, 'steps': 13310, 'loss/train': 1.6530280113220215} +11/06/2021 23:05:12 - INFO - __main__ - Step 13312: {'lr': 0.0004928286485455365, 'samples': 2555904, 'steps': 13311, 'loss/train': 1.1228559017181396} +11/06/2021 23:05:12 - INFO - __main__ - Step 13313: {'lr': 0.0004928273865568521, 'samples': 2556096, 'steps': 13312, 'loss/train': 1.5058236122131348} +11/06/2021 23:05:13 - INFO - __main__ - Step 13314: {'lr': 0.0004928261244587536, 'samples': 2556288, 'steps': 13313, 'loss/train': 1.8624576330184937} +11/06/2021 23:05:13 - INFO - __main__ - Step 13315: {'lr': 0.0004928248622512412, 'samples': 2556480, 'steps': 13314, 'loss/train': 1.4049829244613647} +11/06/2021 23:05:14 - INFO - __main__ - Step 13316: {'lr': 0.0004928235999343159, 'samples': 2556672, 'steps': 13315, 'loss/train': 1.9419476985931396} +11/06/2021 23:05:14 - INFO - __main__ - Step 13317: {'lr': 0.0004928223375079778, 'samples': 2556864, 'steps': 13316, 'loss/train': 1.7618058919906616} +11/06/2021 23:05:14 - INFO - __main__ - Step 13318: {'lr': 0.0004928210749722278, 'samples': 2557056, 'steps': 13317, 'loss/train': 1.606778621673584} +11/06/2021 23:05:15 - INFO - __main__ - Step 13319: {'lr': 0.0004928198123270664, 'samples': 2557248, 'steps': 13318, 'loss/train': 1.5688247680664062} +11/06/2021 23:05:15 - INFO - __main__ - Step 13320: {'lr': 0.0004928185495724942, 'samples': 2557440, 'steps': 13319, 'loss/train': 1.9147883653640747} +11/06/2021 23:05:16 - INFO - __main__ - Step 13321: {'lr': 0.0004928172867085115, 'samples': 2557632, 'steps': 13320, 'loss/train': 1.3374717235565186} +11/06/2021 23:05:17 - INFO - __main__ - Step 13322: {'lr': 0.0004928160237351192, 'samples': 2557824, 'steps': 13321, 'loss/train': 1.7408499717712402} +11/06/2021 23:05:17 - INFO - __main__ - Step 13323: {'lr': 0.0004928147606523179, 'samples': 2558016, 'steps': 13322, 'loss/train': 1.20220947265625} +11/06/2021 23:05:17 - INFO - __main__ - Step 13324: {'lr': 0.0004928134974601078, 'samples': 2558208, 'steps': 13323, 'loss/train': 1.730553388595581} +11/06/2021 23:05:18 - INFO - __main__ - Step 13325: {'lr': 0.0004928122341584897, 'samples': 2558400, 'steps': 13324, 'loss/train': 1.704958200454712} +11/06/2021 23:05:18 - INFO - __main__ - Step 13326: {'lr': 0.0004928109707474643, 'samples': 2558592, 'steps': 13325, 'loss/train': 1.6393741369247437} +11/06/2021 23:05:19 - INFO - __main__ - Step 13327: {'lr': 0.0004928097072270319, 'samples': 2558784, 'steps': 13326, 'loss/train': 1.696864366531372} +11/06/2021 23:05:19 - INFO - __main__ - Step 13328: {'lr': 0.0004928084435971932, 'samples': 2558976, 'steps': 13327, 'loss/train': 1.6887147426605225} +11/06/2021 23:05:20 - INFO - __main__ - Step 13329: {'lr': 0.0004928071798579488, 'samples': 2559168, 'steps': 13328, 'loss/train': 1.7880932092666626} +11/06/2021 23:05:20 - INFO - __main__ - Step 13330: {'lr': 0.0004928059160092993, 'samples': 2559360, 'steps': 13329, 'loss/train': 1.7646552324295044} +11/06/2021 23:05:20 - INFO - __main__ - Step 13331: {'lr': 0.000492804652051245, 'samples': 2559552, 'steps': 13330, 'loss/train': 1.588904857635498} +11/06/2021 23:05:22 - INFO - __main__ - Step 13332: {'lr': 0.0004928033879837868, 'samples': 2559744, 'steps': 13331, 'loss/train': 1.295880675315857} +11/06/2021 23:05:22 - INFO - __main__ - Step 13333: {'lr': 0.0004928021238069251, 'samples': 2559936, 'steps': 13332, 'loss/train': 1.5167969465255737} +11/06/2021 23:05:22 - INFO - __main__ - Step 13334: {'lr': 0.0004928008595206605, 'samples': 2560128, 'steps': 13333, 'loss/train': 0.6749269366264343} +11/06/2021 23:05:23 - INFO - __main__ - Step 13335: {'lr': 0.0004927995951249937, 'samples': 2560320, 'steps': 13334, 'loss/train': 1.3417226076126099} +11/06/2021 23:05:23 - INFO - __main__ - Step 13336: {'lr': 0.0004927983306199251, 'samples': 2560512, 'steps': 13335, 'loss/train': 0.18615388870239258} +11/06/2021 23:05:24 - INFO - __main__ - Step 13337: {'lr': 0.0004927970660054552, 'samples': 2560704, 'steps': 13336, 'loss/train': 1.5057356357574463} +11/06/2021 23:05:25 - INFO - __main__ - Step 13338: {'lr': 0.0004927958012815849, 'samples': 2560896, 'steps': 13337, 'loss/train': 1.761964201927185} +11/06/2021 23:05:25 - INFO - __main__ - Step 13339: {'lr': 0.0004927945364483144, 'samples': 2561088, 'steps': 13338, 'loss/train': 1.5232926607131958} +11/06/2021 23:05:25 - INFO - __main__ - Step 13340: {'lr': 0.0004927932715056444, 'samples': 2561280, 'steps': 13339, 'loss/train': 1.5843162536621094} +11/06/2021 23:05:26 - INFO - __main__ - Step 13341: {'lr': 0.0004927920064535756, 'samples': 2561472, 'steps': 13340, 'loss/train': 1.808425784111023} +11/06/2021 23:05:27 - INFO - __main__ - Step 13342: {'lr': 0.0004927907412921084, 'samples': 2561664, 'steps': 13341, 'loss/train': 1.7012680768966675} +11/06/2021 23:05:27 - INFO - __main__ - Step 13343: {'lr': 0.0004927894760212435, 'samples': 2561856, 'steps': 13342, 'loss/train': 1.866380214691162} +11/06/2021 23:05:27 - INFO - __main__ - Step 13344: {'lr': 0.0004927882106409813, 'samples': 2562048, 'steps': 13343, 'loss/train': 0.6757373213768005} +11/06/2021 23:05:28 - INFO - __main__ - Step 13345: {'lr': 0.0004927869451513226, 'samples': 2562240, 'steps': 13344, 'loss/train': 1.5792934894561768} +11/06/2021 23:05:28 - INFO - __main__ - Step 13346: {'lr': 0.0004927856795522678, 'samples': 2562432, 'steps': 13345, 'loss/train': 1.1496813297271729} +11/06/2021 23:05:29 - INFO - __main__ - Step 13347: {'lr': 0.0004927844138438175, 'samples': 2562624, 'steps': 13346, 'loss/train': 1.646971344947815} +11/06/2021 23:05:29 - INFO - __main__ - Step 13348: {'lr': 0.0004927831480259723, 'samples': 2562816, 'steps': 13347, 'loss/train': 1.720847725868225} +11/06/2021 23:05:30 - INFO - __main__ - Step 13349: {'lr': 0.0004927818820987328, 'samples': 2563008, 'steps': 13348, 'loss/train': 1.679519534111023} +11/06/2021 23:05:30 - INFO - __main__ - Step 13350: {'lr': 0.0004927806160620995, 'samples': 2563200, 'steps': 13349, 'loss/train': 2.182821750640869} +11/06/2021 23:05:30 - INFO - __main__ - Step 13351: {'lr': 0.0004927793499160729, 'samples': 2563392, 'steps': 13350, 'loss/train': 2.1079049110412598} +11/06/2021 23:05:31 - INFO - __main__ - Step 13352: {'lr': 0.000492778083660654, 'samples': 2563584, 'steps': 13351, 'loss/train': 1.3878504037857056} +11/06/2021 23:05:32 - INFO - __main__ - Step 13353: {'lr': 0.0004927768172958427, 'samples': 2563776, 'steps': 13352, 'loss/train': 1.9145451784133911} +11/06/2021 23:05:32 - INFO - __main__ - Step 13354: {'lr': 0.00049277555082164, 'samples': 2563968, 'steps': 13353, 'loss/train': 1.463181495666504} +11/06/2021 23:05:33 - INFO - __main__ - Step 13355: {'lr': 0.0004927742842380465, 'samples': 2564160, 'steps': 13354, 'loss/train': 2.1269948482513428} +11/06/2021 23:05:33 - INFO - __main__ - Step 13356: {'lr': 0.0004927730175450626, 'samples': 2564352, 'steps': 13355, 'loss/train': 1.5894335508346558} +11/06/2021 23:05:34 - INFO - __main__ - Step 13357: {'lr': 0.0004927717507426887, 'samples': 2564544, 'steps': 13356, 'loss/train': 1.5174648761749268} +11/06/2021 23:05:34 - INFO - __main__ - Step 13358: {'lr': 0.0004927704838309259, 'samples': 2564736, 'steps': 13357, 'loss/train': 1.6864207983016968} +11/06/2021 23:05:35 - INFO - __main__ - Step 13359: {'lr': 0.0004927692168097743, 'samples': 2564928, 'steps': 13358, 'loss/train': 1.3122807741165161} +11/06/2021 23:05:35 - INFO - __main__ - Step 13360: {'lr': 0.0004927679496792347, 'samples': 2565120, 'steps': 13359, 'loss/train': 1.738892674446106} +11/06/2021 23:05:35 - INFO - __main__ - Step 13361: {'lr': 0.0004927666824393076, 'samples': 2565312, 'steps': 13360, 'loss/train': 0.4052657186985016} +11/06/2021 23:05:36 - INFO - __main__ - Step 13362: {'lr': 0.0004927654150899937, 'samples': 2565504, 'steps': 13361, 'loss/train': 2.3916163444519043} +11/06/2021 23:05:37 - INFO - __main__ - Step 13363: {'lr': 0.0004927641476312932, 'samples': 2565696, 'steps': 13362, 'loss/train': 1.5969182252883911} +11/06/2021 23:05:37 - INFO - __main__ - Step 13364: {'lr': 0.000492762880063207, 'samples': 2565888, 'steps': 13363, 'loss/train': 1.332525610923767} +11/06/2021 23:05:37 - INFO - __main__ - Step 13365: {'lr': 0.0004927616123857357, 'samples': 2566080, 'steps': 13364, 'loss/train': 1.9494463205337524} +11/06/2021 23:05:38 - INFO - __main__ - Step 13366: {'lr': 0.0004927603445988797, 'samples': 2566272, 'steps': 13365, 'loss/train': 1.918675422668457} +11/06/2021 23:05:39 - INFO - __main__ - Step 13367: {'lr': 0.0004927590767026396, 'samples': 2566464, 'steps': 13366, 'loss/train': 2.5392587184906006} +11/06/2021 23:05:39 - INFO - __main__ - Step 13368: {'lr': 0.0004927578086970161, 'samples': 2566656, 'steps': 13367, 'loss/train': 1.7140586376190186} +11/06/2021 23:05:39 - INFO - __main__ - Step 13369: {'lr': 0.0004927565405820096, 'samples': 2566848, 'steps': 13368, 'loss/train': 1.7201263904571533} +11/06/2021 23:05:40 - INFO - __main__ - Step 13370: {'lr': 0.0004927552723576207, 'samples': 2567040, 'steps': 13369, 'loss/train': 1.939740777015686} +11/06/2021 23:05:40 - INFO - __main__ - Step 13371: {'lr': 0.0004927540040238501, 'samples': 2567232, 'steps': 13370, 'loss/train': 1.2085801362991333} +11/06/2021 23:05:41 - INFO - __main__ - Step 13372: {'lr': 0.0004927527355806983, 'samples': 2567424, 'steps': 13371, 'loss/train': 1.3057010173797607} +11/06/2021 23:05:41 - INFO - __main__ - Step 13373: {'lr': 0.0004927514670281659, 'samples': 2567616, 'steps': 13372, 'loss/train': 1.3879728317260742} +11/06/2021 23:05:42 - INFO - __main__ - Step 13374: {'lr': 0.0004927501983662534, 'samples': 2567808, 'steps': 13373, 'loss/train': 2.229905128479004} +11/06/2021 23:05:42 - INFO - __main__ - Step 13375: {'lr': 0.0004927489295949613, 'samples': 2568000, 'steps': 13374, 'loss/train': 1.403855562210083} +11/06/2021 23:05:43 - INFO - __main__ - Step 13376: {'lr': 0.0004927476607142904, 'samples': 2568192, 'steps': 13375, 'loss/train': 1.8529839515686035} +11/06/2021 23:05:44 - INFO - __main__ - Step 13377: {'lr': 0.0004927463917242411, 'samples': 2568384, 'steps': 13376, 'loss/train': 1.6956440210342407} +11/06/2021 23:05:44 - INFO - __main__ - Step 13378: {'lr': 0.0004927451226248141, 'samples': 2568576, 'steps': 13377, 'loss/train': 1.5961147546768188} +11/06/2021 23:05:44 - INFO - __main__ - Step 13379: {'lr': 0.0004927438534160098, 'samples': 2568768, 'steps': 13378, 'loss/train': 1.2757984399795532} +11/06/2021 23:05:45 - INFO - __main__ - Step 13380: {'lr': 0.0004927425840978289, 'samples': 2568960, 'steps': 13379, 'loss/train': 1.361778736114502} +11/06/2021 23:05:45 - INFO - __main__ - Step 13381: {'lr': 0.0004927413146702719, 'samples': 2569152, 'steps': 13380, 'loss/train': 1.2567278146743774} +11/06/2021 23:05:45 - INFO - __main__ - Step 13382: {'lr': 0.0004927400451333394, 'samples': 2569344, 'steps': 13381, 'loss/train': 1.9279859066009521} +11/06/2021 23:05:46 - INFO - __main__ - Step 13383: {'lr': 0.0004927387754870321, 'samples': 2569536, 'steps': 13382, 'loss/train': 0.35177692770957947} +11/06/2021 23:05:47 - INFO - __main__ - Step 13384: {'lr': 0.0004927375057313504, 'samples': 2569728, 'steps': 13383, 'loss/train': 2.1717875003814697} +11/06/2021 23:05:47 - INFO - __main__ - Step 13385: {'lr': 0.0004927362358662948, 'samples': 2569920, 'steps': 13384, 'loss/train': 1.7761980295181274} +11/06/2021 23:05:47 - INFO - __main__ - Step 13386: {'lr': 0.0004927349658918662, 'samples': 2570112, 'steps': 13385, 'loss/train': 1.3248966932296753} +11/06/2021 23:05:48 - INFO - __main__ - Step 13387: {'lr': 0.0004927336958080648, 'samples': 2570304, 'steps': 13386, 'loss/train': 1.88877272605896} +11/06/2021 23:05:49 - INFO - __main__ - Step 13388: {'lr': 0.0004927324256148914, 'samples': 2570496, 'steps': 13387, 'loss/train': 1.2974435091018677} +11/06/2021 23:05:49 - INFO - __main__ - Step 13389: {'lr': 0.0004927311553123465, 'samples': 2570688, 'steps': 13388, 'loss/train': 1.5624191761016846} +11/06/2021 23:05:50 - INFO - __main__ - Step 13390: {'lr': 0.0004927298849004307, 'samples': 2570880, 'steps': 13389, 'loss/train': 1.5980331897735596} +11/06/2021 23:05:50 - INFO - __main__ - Step 13391: {'lr': 0.0004927286143791447, 'samples': 2571072, 'steps': 13390, 'loss/train': 2.0183682441711426} +11/06/2021 23:05:50 - INFO - __main__ - Step 13392: {'lr': 0.0004927273437484888, 'samples': 2571264, 'steps': 13391, 'loss/train': 1.7328522205352783} +11/06/2021 23:05:51 - INFO - __main__ - Step 13393: {'lr': 0.0004927260730084636, 'samples': 2571456, 'steps': 13392, 'loss/train': 1.669248342514038} +11/06/2021 23:05:52 - INFO - __main__ - Step 13394: {'lr': 0.0004927248021590699, 'samples': 2571648, 'steps': 13393, 'loss/train': 2.133970022201538} +11/06/2021 23:05:52 - INFO - __main__ - Step 13395: {'lr': 0.0004927235312003082, 'samples': 2571840, 'steps': 13394, 'loss/train': 1.0649173259735107} +11/06/2021 23:05:52 - INFO - __main__ - Step 13396: {'lr': 0.0004927222601321789, 'samples': 2572032, 'steps': 13395, 'loss/train': 2.6536405086517334} +11/06/2021 23:05:53 - INFO - __main__ - Step 13397: {'lr': 0.0004927209889546828, 'samples': 2572224, 'steps': 13396, 'loss/train': 1.37748122215271} +11/06/2021 23:05:54 - INFO - __main__ - Step 13398: {'lr': 0.0004927197176678203, 'samples': 2572416, 'steps': 13397, 'loss/train': 1.8754839897155762} +11/06/2021 23:05:54 - INFO - __main__ - Step 13399: {'lr': 0.000492718446271592, 'samples': 2572608, 'steps': 13398, 'loss/train': 1.372225284576416} +11/06/2021 23:05:55 - INFO - __main__ - Step 13400: {'lr': 0.0004927171747659986, 'samples': 2572800, 'steps': 13399, 'loss/train': 1.8654577732086182} +11/06/2021 23:05:55 - INFO - __main__ - Step 13401: {'lr': 0.0004927159031510405, 'samples': 2572992, 'steps': 13400, 'loss/train': 0.6154890060424805} +11/06/2021 23:05:55 - INFO - __main__ - Step 13402: {'lr': 0.0004927146314267184, 'samples': 2573184, 'steps': 13401, 'loss/train': 1.4731422662734985} +11/06/2021 23:05:57 - INFO - __main__ - Step 13403: {'lr': 0.000492713359593033, 'samples': 2573376, 'steps': 13402, 'loss/train': 1.8210397958755493} +11/06/2021 23:05:57 - INFO - __main__ - Step 13404: {'lr': 0.0004927120876499846, 'samples': 2573568, 'steps': 13403, 'loss/train': 2.1863057613372803} +11/06/2021 23:05:57 - INFO - __main__ - Step 13405: {'lr': 0.0004927108155975738, 'samples': 2573760, 'steps': 13404, 'loss/train': 1.5386931896209717} +11/06/2021 23:05:58 - INFO - __main__ - Step 13406: {'lr': 0.0004927095434358012, 'samples': 2573952, 'steps': 13405, 'loss/train': 2.4172680377960205} +11/06/2021 23:05:58 - INFO - __main__ - Step 13407: {'lr': 0.0004927082711646676, 'samples': 2574144, 'steps': 13406, 'loss/train': 1.7488776445388794} +11/06/2021 23:05:58 - INFO - __main__ - Step 13408: {'lr': 0.0004927069987841733, 'samples': 2574336, 'steps': 13407, 'loss/train': 2.008625030517578} +11/06/2021 23:05:59 - INFO - __main__ - Step 13409: {'lr': 0.0004927057262943189, 'samples': 2574528, 'steps': 13408, 'loss/train': 1.6773982048034668} +11/06/2021 23:06:00 - INFO - __main__ - Step 13410: {'lr': 0.0004927044536951052, 'samples': 2574720, 'steps': 13409, 'loss/train': 2.1111257076263428} +11/06/2021 23:06:00 - INFO - __main__ - Step 13411: {'lr': 0.0004927031809865324, 'samples': 2574912, 'steps': 13410, 'loss/train': 1.8370585441589355} +11/06/2021 23:06:00 - INFO - __main__ - Step 13412: {'lr': 0.0004927019081686015, 'samples': 2575104, 'steps': 13411, 'loss/train': 1.4143866300582886} +11/06/2021 23:06:01 - INFO - __main__ - Step 13413: {'lr': 0.0004927006352413128, 'samples': 2575296, 'steps': 13412, 'loss/train': 1.1940877437591553} +11/06/2021 23:06:02 - INFO - __main__ - Step 13414: {'lr': 0.000492699362204667, 'samples': 2575488, 'steps': 13413, 'loss/train': 1.8130630254745483} +11/06/2021 23:06:02 - INFO - __main__ - Step 13415: {'lr': 0.0004926980890586645, 'samples': 2575680, 'steps': 13414, 'loss/train': 1.6337990760803223} +11/06/2021 23:06:02 - INFO - __main__ - Step 13416: {'lr': 0.000492696815803306, 'samples': 2575872, 'steps': 13415, 'loss/train': 1.7381833791732788} +11/06/2021 23:06:03 - INFO - __main__ - Step 13417: {'lr': 0.0004926955424385921, 'samples': 2576064, 'steps': 13416, 'loss/train': 1.8581897020339966} +11/06/2021 23:06:03 - INFO - __main__ - Step 13418: {'lr': 0.0004926942689645234, 'samples': 2576256, 'steps': 13417, 'loss/train': 0.9027330875396729} +11/06/2021 23:06:04 - INFO - __main__ - Step 13419: {'lr': 0.0004926929953811003, 'samples': 2576448, 'steps': 13418, 'loss/train': 1.8112411499023438} +11/06/2021 23:06:05 - INFO - __main__ - Step 13420: {'lr': 0.0004926917216883235, 'samples': 2576640, 'steps': 13419, 'loss/train': 1.7219598293304443} +11/06/2021 23:06:05 - INFO - __main__ - Step 13421: {'lr': 0.0004926904478861937, 'samples': 2576832, 'steps': 13420, 'loss/train': 1.8902779817581177} +11/06/2021 23:06:05 - INFO - __main__ - Step 13422: {'lr': 0.0004926891739747111, 'samples': 2577024, 'steps': 13421, 'loss/train': 1.9297341108322144} +11/06/2021 23:06:06 - INFO - __main__ - Step 13423: {'lr': 0.0004926878999538766, 'samples': 2577216, 'steps': 13422, 'loss/train': 1.187242865562439} +11/06/2021 23:06:07 - INFO - __main__ - Step 13424: {'lr': 0.0004926866258236907, 'samples': 2577408, 'steps': 13423, 'loss/train': 2.304779529571533} +11/06/2021 23:06:07 - INFO - __main__ - Step 13425: {'lr': 0.000492685351584154, 'samples': 2577600, 'steps': 13424, 'loss/train': 2.2769415378570557} +11/06/2021 23:06:07 - INFO - __main__ - Step 13426: {'lr': 0.000492684077235267, 'samples': 2577792, 'steps': 13425, 'loss/train': 0.9876941442489624} +11/06/2021 23:06:08 - INFO - __main__ - Step 13427: {'lr': 0.0004926828027770302, 'samples': 2577984, 'steps': 13426, 'loss/train': 1.4643722772598267} +11/06/2021 23:06:08 - INFO - __main__ - Step 13428: {'lr': 0.0004926815282094443, 'samples': 2578176, 'steps': 13427, 'loss/train': 2.2351608276367188} +11/06/2021 23:06:09 - INFO - __main__ - Step 13429: {'lr': 0.00049268025353251, 'samples': 2578368, 'steps': 13428, 'loss/train': 1.725936770439148} +11/06/2021 23:06:09 - INFO - __main__ - Step 13430: {'lr': 0.0004926789787462276, 'samples': 2578560, 'steps': 13429, 'loss/train': 1.8152636289596558} +11/06/2021 23:06:10 - INFO - __main__ - Step 13431: {'lr': 0.0004926777038505978, 'samples': 2578752, 'steps': 13430, 'loss/train': 1.673268437385559} +11/06/2021 23:06:10 - INFO - __main__ - Step 13432: {'lr': 0.0004926764288456212, 'samples': 2578944, 'steps': 13431, 'loss/train': 1.6883317232131958} +11/06/2021 23:06:10 - INFO - __main__ - Step 13433: {'lr': 0.0004926751537312982, 'samples': 2579136, 'steps': 13432, 'loss/train': 1.6265524625778198} +11/06/2021 23:06:11 - INFO - __main__ - Step 13434: {'lr': 0.0004926738785076297, 'samples': 2579328, 'steps': 13433, 'loss/train': 1.6185946464538574} +11/06/2021 23:06:12 - INFO - __main__ - Step 13435: {'lr': 0.000492672603174616, 'samples': 2579520, 'steps': 13434, 'loss/train': 1.6138404607772827} +11/06/2021 23:06:12 - INFO - __main__ - Step 13436: {'lr': 0.0004926713277322579, 'samples': 2579712, 'steps': 13435, 'loss/train': 1.8457807302474976} +11/06/2021 23:06:13 - INFO - __main__ - Step 13437: {'lr': 0.0004926700521805557, 'samples': 2579904, 'steps': 13436, 'loss/train': 1.5972094535827637} +11/06/2021 23:06:13 - INFO - __main__ - Step 13438: {'lr': 0.0004926687765195102, 'samples': 2580096, 'steps': 13437, 'loss/train': 1.67529296875} +11/06/2021 23:06:14 - INFO - __main__ - Step 13439: {'lr': 0.0004926675007491218, 'samples': 2580288, 'steps': 13438, 'loss/train': 1.481308937072754} +11/06/2021 23:06:14 - INFO - __main__ - Step 13440: {'lr': 0.0004926662248693912, 'samples': 2580480, 'steps': 13439, 'loss/train': 1.9427311420440674} +11/06/2021 23:06:15 - INFO - __main__ - Step 13441: {'lr': 0.000492664948880319, 'samples': 2580672, 'steps': 13440, 'loss/train': 1.513269305229187} +11/06/2021 23:06:15 - INFO - __main__ - Step 13442: {'lr': 0.0004926636727819057, 'samples': 2580864, 'steps': 13441, 'loss/train': 2.367624282836914} +11/06/2021 23:06:15 - INFO - __main__ - Step 13443: {'lr': 0.0004926623965741519, 'samples': 2581056, 'steps': 13442, 'loss/train': 1.679581880569458} +11/06/2021 23:06:16 - INFO - __main__ - Step 13444: {'lr': 0.0004926611202570582, 'samples': 2581248, 'steps': 13443, 'loss/train': 1.8118009567260742} +11/06/2021 23:06:17 - INFO - __main__ - Step 13445: {'lr': 0.0004926598438306252, 'samples': 2581440, 'steps': 13444, 'loss/train': 1.1700359582901} +11/06/2021 23:06:17 - INFO - __main__ - Step 13446: {'lr': 0.0004926585672948532, 'samples': 2581632, 'steps': 13445, 'loss/train': 1.750053882598877} +11/06/2021 23:06:17 - INFO - __main__ - Step 13447: {'lr': 0.0004926572906497432, 'samples': 2581824, 'steps': 13446, 'loss/train': 1.81050705909729} +11/06/2021 23:06:18 - INFO - __main__ - Step 13448: {'lr': 0.0004926560138952955, 'samples': 2582016, 'steps': 13447, 'loss/train': 1.7286831140518188} +11/06/2021 23:06:19 - INFO - __main__ - Step 13449: {'lr': 0.0004926547370315106, 'samples': 2582208, 'steps': 13448, 'loss/train': 1.6813172101974487} +11/06/2021 23:06:19 - INFO - __main__ - Step 13450: {'lr': 0.0004926534600583894, 'samples': 2582400, 'steps': 13449, 'loss/train': 3.3553547859191895} +11/06/2021 23:06:20 - INFO - __main__ - Step 13451: {'lr': 0.0004926521829759323, 'samples': 2582592, 'steps': 13450, 'loss/train': 2.9841389656066895} +11/06/2021 23:06:20 - INFO - __main__ - Step 13452: {'lr': 0.0004926509057841397, 'samples': 2582784, 'steps': 13451, 'loss/train': 2.232959032058716} +11/06/2021 23:06:20 - INFO - __main__ - Step 13453: {'lr': 0.0004926496284830125, 'samples': 2582976, 'steps': 13452, 'loss/train': 0.9120754599571228} +11/06/2021 23:06:21 - INFO - __main__ - Step 13454: {'lr': 0.0004926483510725511, 'samples': 2583168, 'steps': 13453, 'loss/train': 0.20907138288021088} +11/06/2021 23:06:22 - INFO - __main__ - Step 13455: {'lr': 0.000492647073552756, 'samples': 2583360, 'steps': 13454, 'loss/train': 0.17836831510066986} +11/06/2021 23:06:22 - INFO - __main__ - Step 13456: {'lr': 0.000492645795923628, 'samples': 2583552, 'steps': 13455, 'loss/train': 1.9313207864761353} +11/06/2021 23:06:23 - INFO - __main__ - Step 13457: {'lr': 0.0004926445181851675, 'samples': 2583744, 'steps': 13456, 'loss/train': 1.514086365699768} +11/06/2021 23:06:23 - INFO - __main__ - Step 13458: {'lr': 0.0004926432403373752, 'samples': 2583936, 'steps': 13457, 'loss/train': 2.219507932662964} +11/06/2021 23:06:23 - INFO - __main__ - Step 13459: {'lr': 0.0004926419623802515, 'samples': 2584128, 'steps': 13458, 'loss/train': 1.9155421257019043} +11/06/2021 23:06:24 - INFO - __main__ - Step 13460: {'lr': 0.0004926406843137971, 'samples': 2584320, 'steps': 13459, 'loss/train': 1.7302833795547485} +11/06/2021 23:06:25 - INFO - __main__ - Step 13461: {'lr': 0.0004926394061380126, 'samples': 2584512, 'steps': 13460, 'loss/train': 1.796723484992981} +11/06/2021 23:06:25 - INFO - __main__ - Step 13462: {'lr': 0.0004926381278528984, 'samples': 2584704, 'steps': 13461, 'loss/train': 1.6994954347610474} +11/06/2021 23:06:25 - INFO - __main__ - Step 13463: {'lr': 0.0004926368494584553, 'samples': 2584896, 'steps': 13462, 'loss/train': 0.4757920205593109} +11/06/2021 23:06:26 - INFO - __main__ - Step 13464: {'lr': 0.0004926355709546838, 'samples': 2585088, 'steps': 13463, 'loss/train': 1.7972795963287354} +11/06/2021 23:06:26 - INFO - __main__ - Step 13465: {'lr': 0.0004926342923415844, 'samples': 2585280, 'steps': 13464, 'loss/train': 1.8750228881835938} +11/06/2021 23:06:27 - INFO - __main__ - Step 13466: {'lr': 0.0004926330136191577, 'samples': 2585472, 'steps': 13465, 'loss/train': 2.082622766494751} +11/06/2021 23:06:28 - INFO - __main__ - Step 13467: {'lr': 0.0004926317347874044, 'samples': 2585664, 'steps': 13466, 'loss/train': 1.9300429821014404} +11/06/2021 23:06:28 - INFO - __main__ - Step 13468: {'lr': 0.000492630455846325, 'samples': 2585856, 'steps': 13467, 'loss/train': 1.32011079788208} +11/06/2021 23:06:28 - INFO - __main__ - Step 13469: {'lr': 0.0004926291767959199, 'samples': 2586048, 'steps': 13468, 'loss/train': 3.767948865890503} +11/06/2021 23:06:29 - INFO - __main__ - Step 13470: {'lr': 0.00049262789763619, 'samples': 2586240, 'steps': 13469, 'loss/train': 1.0086846351623535} +11/06/2021 23:06:30 - INFO - __main__ - Step 13471: {'lr': 0.0004926266183671356, 'samples': 2586432, 'steps': 13470, 'loss/train': 1.8389583826065063} +11/06/2021 23:06:30 - INFO - __main__ - Step 13472: {'lr': 0.0004926253389887575, 'samples': 2586624, 'steps': 13471, 'loss/train': 1.7652056217193604} +11/06/2021 23:06:31 - INFO - __main__ - Step 13473: {'lr': 0.0004926240595010561, 'samples': 2586816, 'steps': 13472, 'loss/train': 1.13629949092865} +11/06/2021 23:06:31 - INFO - __main__ - Step 13474: {'lr': 0.000492622779904032, 'samples': 2587008, 'steps': 13473, 'loss/train': 1.531381368637085} +11/06/2021 23:06:31 - INFO - __main__ - Step 13475: {'lr': 0.000492621500197686, 'samples': 2587200, 'steps': 13474, 'loss/train': 1.4940797090530396} +11/06/2021 23:06:32 - INFO - __main__ - Step 13476: {'lr': 0.0004926202203820182, 'samples': 2587392, 'steps': 13475, 'loss/train': 1.8899670839309692} +11/06/2021 23:06:33 - INFO - __main__ - Step 13477: {'lr': 0.0004926189404570297, 'samples': 2587584, 'steps': 13476, 'loss/train': 1.735036015510559} +11/06/2021 23:06:33 - INFO - __main__ - Step 13478: {'lr': 0.0004926176604227208, 'samples': 2587776, 'steps': 13477, 'loss/train': 1.7047059535980225} +11/06/2021 23:06:33 - INFO - __main__ - Step 13479: {'lr': 0.0004926163802790922, 'samples': 2587968, 'steps': 13478, 'loss/train': 2.1699039936065674} +11/06/2021 23:06:34 - INFO - __main__ - Step 13480: {'lr': 0.0004926151000261442, 'samples': 2588160, 'steps': 13479, 'loss/train': 1.8087481260299683} +11/06/2021 23:06:34 - INFO - __main__ - Step 13481: {'lr': 0.0004926138196638777, 'samples': 2588352, 'steps': 13480, 'loss/train': 1.056817889213562} +11/06/2021 23:06:35 - INFO - __main__ - Step 13482: {'lr': 0.0004926125391922932, 'samples': 2588544, 'steps': 13481, 'loss/train': 1.3383749723434448} +11/06/2021 23:06:36 - INFO - __main__ - Step 13483: {'lr': 0.0004926112586113912, 'samples': 2588736, 'steps': 13482, 'loss/train': 1.4926176071166992} +11/06/2021 23:06:36 - INFO - __main__ - Step 13484: {'lr': 0.0004926099779211723, 'samples': 2588928, 'steps': 13483, 'loss/train': 1.5623829364776611} +11/06/2021 23:06:36 - INFO - __main__ - Step 13485: {'lr': 0.0004926086971216371, 'samples': 2589120, 'steps': 13484, 'loss/train': 1.7945960760116577} +11/06/2021 23:06:37 - INFO - __main__ - Step 13486: {'lr': 0.0004926074162127862, 'samples': 2589312, 'steps': 13485, 'loss/train': 1.6965285539627075} +11/06/2021 23:06:38 - INFO - __main__ - Step 13487: {'lr': 0.0004926061351946201, 'samples': 2589504, 'steps': 13486, 'loss/train': 2.568559169769287} +11/06/2021 23:06:39 - INFO - __main__ - Step 13488: {'lr': 0.0004926048540671394, 'samples': 2589696, 'steps': 13487, 'loss/train': 0.929760754108429} +11/06/2021 23:06:39 - INFO - __main__ - Step 13489: {'lr': 0.0004926035728303447, 'samples': 2589888, 'steps': 13488, 'loss/train': 1.9634153842926025} +11/06/2021 23:06:39 - INFO - __main__ - Step 13490: {'lr': 0.0004926022914842366, 'samples': 2590080, 'steps': 13489, 'loss/train': 0.19946490228176117} +11/06/2021 23:06:40 - INFO - __main__ - Step 13491: {'lr': 0.0004926010100288156, 'samples': 2590272, 'steps': 13490, 'loss/train': 1.7599334716796875} +11/06/2021 23:06:41 - INFO - __main__ - Step 13492: {'lr': 0.0004925997284640823, 'samples': 2590464, 'steps': 13491, 'loss/train': 1.668752908706665} +11/06/2021 23:06:41 - INFO - __main__ - Step 13493: {'lr': 0.0004925984467900374, 'samples': 2590656, 'steps': 13492, 'loss/train': 1.4135771989822388} +11/06/2021 23:06:41 - INFO - __main__ - Step 13494: {'lr': 0.0004925971650066814, 'samples': 2590848, 'steps': 13493, 'loss/train': 2.2493417263031006} +11/06/2021 23:06:42 - INFO - __main__ - Step 13495: {'lr': 0.0004925958831140147, 'samples': 2591040, 'steps': 13494, 'loss/train': 1.576822280883789} +11/06/2021 23:06:42 - INFO - __main__ - Step 13496: {'lr': 0.0004925946011120382, 'samples': 2591232, 'steps': 13495, 'loss/train': 2.3239166736602783} +11/06/2021 23:06:43 - INFO - __main__ - Step 13497: {'lr': 0.0004925933190007523, 'samples': 2591424, 'steps': 13496, 'loss/train': 1.5112223625183105} +11/06/2021 23:06:44 - INFO - __main__ - Step 13498: {'lr': 0.0004925920367801575, 'samples': 2591616, 'steps': 13497, 'loss/train': 1.7464356422424316} +11/06/2021 23:06:44 - INFO - __main__ - Step 13499: {'lr': 0.0004925907544502545, 'samples': 2591808, 'steps': 13498, 'loss/train': 1.7748905420303345} +11/06/2021 23:06:44 - INFO - __main__ - Step 13500: {'lr': 0.000492589472011044, 'samples': 2592000, 'steps': 13499, 'loss/train': 2.0992441177368164} +11/06/2021 23:06:45 - INFO - __main__ - Step 13501: {'lr': 0.0004925881894625263, 'samples': 2592192, 'steps': 13500, 'loss/train': 1.2124189138412476} +11/06/2021 23:06:46 - INFO - __main__ - Step 13502: {'lr': 0.0004925869068047021, 'samples': 2592384, 'steps': 13501, 'loss/train': 1.7404388189315796} +11/06/2021 23:06:46 - INFO - __main__ - Step 13503: {'lr': 0.000492585624037572, 'samples': 2592576, 'steps': 13502, 'loss/train': 1.5108038187026978} +11/06/2021 23:06:46 - INFO - __main__ - Step 13504: {'lr': 0.0004925843411611366, 'samples': 2592768, 'steps': 13503, 'loss/train': 1.60819673538208} +11/06/2021 23:06:47 - INFO - __main__ - Step 13505: {'lr': 0.0004925830581753964, 'samples': 2592960, 'steps': 13504, 'loss/train': 2.066511631011963} +11/06/2021 23:06:47 - INFO - __main__ - Step 13506: {'lr': 0.000492581775080352, 'samples': 2593152, 'steps': 13505, 'loss/train': 1.5650289058685303} +11/06/2021 23:06:48 - INFO - __main__ - Step 13507: {'lr': 0.000492580491876004, 'samples': 2593344, 'steps': 13506, 'loss/train': 1.7949551343917847} +11/06/2021 23:06:48 - INFO - __main__ - Step 13508: {'lr': 0.000492579208562353, 'samples': 2593536, 'steps': 13507, 'loss/train': 1.567403793334961} +11/06/2021 23:06:49 - INFO - __main__ - Step 13509: {'lr': 0.0004925779251393995, 'samples': 2593728, 'steps': 13508, 'loss/train': 2.0398895740509033} +11/06/2021 23:06:49 - INFO - __main__ - Step 13510: {'lr': 0.0004925766416071441, 'samples': 2593920, 'steps': 13509, 'loss/train': 1.7081353664398193} +11/06/2021 23:06:49 - INFO - __main__ - Step 13511: {'lr': 0.0004925753579655876, 'samples': 2594112, 'steps': 13510, 'loss/train': 1.5593316555023193} +11/06/2021 23:06:51 - INFO - __main__ - Step 13512: {'lr': 0.0004925740742147302, 'samples': 2594304, 'steps': 13511, 'loss/train': 1.8523802757263184} +11/06/2021 23:06:51 - INFO - __main__ - Step 13513: {'lr': 0.0004925727903545727, 'samples': 2594496, 'steps': 13512, 'loss/train': 1.662975788116455} +11/06/2021 23:06:51 - INFO - __main__ - Step 13514: {'lr': 0.0004925715063851157, 'samples': 2594688, 'steps': 13513, 'loss/train': 1.6688578128814697} +11/06/2021 23:06:52 - INFO - __main__ - Step 13515: {'lr': 0.0004925702223063597, 'samples': 2594880, 'steps': 13514, 'loss/train': 0.6073575019836426} +11/06/2021 23:06:52 - INFO - __main__ - Step 13516: {'lr': 0.0004925689381183052, 'samples': 2595072, 'steps': 13515, 'loss/train': 1.6856118440628052} +11/06/2021 23:06:52 - INFO - __main__ - Step 13517: {'lr': 0.0004925676538209531, 'samples': 2595264, 'steps': 13516, 'loss/train': 2.147181510925293} +11/06/2021 23:06:53 - INFO - __main__ - Step 13518: {'lr': 0.0004925663694143036, 'samples': 2595456, 'steps': 13517, 'loss/train': 1.5106788873672485} +11/06/2021 23:06:54 - INFO - __main__ - Step 13519: {'lr': 0.0004925650848983575, 'samples': 2595648, 'steps': 13518, 'loss/train': 1.8200280666351318} +11/06/2021 23:06:54 - INFO - __main__ - Step 13520: {'lr': 0.0004925638002731153, 'samples': 2595840, 'steps': 13519, 'loss/train': 1.5269951820373535} +11/06/2021 23:06:54 - INFO - __main__ - Step 13521: {'lr': 0.0004925625155385775, 'samples': 2596032, 'steps': 13520, 'loss/train': 1.926583170890808} +11/06/2021 23:06:55 - INFO - __main__ - Step 13522: {'lr': 0.0004925612306947449, 'samples': 2596224, 'steps': 13521, 'loss/train': 1.5432051420211792} +11/06/2021 23:06:56 - INFO - __main__ - Step 13523: {'lr': 0.0004925599457416179, 'samples': 2596416, 'steps': 13522, 'loss/train': 1.8082655668258667} +11/06/2021 23:06:56 - INFO - __main__ - Step 13524: {'lr': 0.0004925586606791972, 'samples': 2596608, 'steps': 13523, 'loss/train': 1.771362543106079} +11/06/2021 23:06:56 - INFO - __main__ - Step 13525: {'lr': 0.0004925573755074832, 'samples': 2596800, 'steps': 13524, 'loss/train': 1.9710201025009155} +11/06/2021 23:06:57 - INFO - __main__ - Step 13526: {'lr': 0.0004925560902264766, 'samples': 2596992, 'steps': 13525, 'loss/train': 1.8510551452636719} +11/06/2021 23:06:57 - INFO - __main__ - Step 13527: {'lr': 0.000492554804836178, 'samples': 2597184, 'steps': 13526, 'loss/train': 1.7917557954788208} +11/06/2021 23:06:59 - INFO - __main__ - Step 13528: {'lr': 0.000492553519336588, 'samples': 2597376, 'steps': 13527, 'loss/train': 1.3388181924819946} +11/06/2021 23:06:59 - INFO - __main__ - Step 13529: {'lr': 0.000492552233727707, 'samples': 2597568, 'steps': 13528, 'loss/train': 1.9206374883651733} +11/06/2021 23:07:00 - INFO - __main__ - Step 13530: {'lr': 0.0004925509480095358, 'samples': 2597760, 'steps': 13529, 'loss/train': 1.7673835754394531} +11/06/2021 23:07:00 - INFO - __main__ - Step 13531: {'lr': 0.0004925496621820749, 'samples': 2597952, 'steps': 13530, 'loss/train': 1.4747488498687744} +11/06/2021 23:07:00 - INFO - __main__ - Step 13532: {'lr': 0.0004925483762453249, 'samples': 2598144, 'steps': 13531, 'loss/train': 0.7193357944488525} +11/06/2021 23:07:01 - INFO - __main__ - Step 13533: {'lr': 0.0004925470901992863, 'samples': 2598336, 'steps': 13532, 'loss/train': 1.6905871629714966} +11/06/2021 23:07:02 - INFO - __main__ - Step 13534: {'lr': 0.0004925458040439596, 'samples': 2598528, 'steps': 13533, 'loss/train': 1.825111985206604} +11/06/2021 23:07:02 - INFO - __main__ - Step 13535: {'lr': 0.0004925445177793457, 'samples': 2598720, 'steps': 13534, 'loss/train': 1.879388689994812} +11/06/2021 23:07:02 - INFO - __main__ - Step 13536: {'lr': 0.0004925432314054448, 'samples': 2598912, 'steps': 13535, 'loss/train': 1.898144006729126} +11/06/2021 23:07:03 - INFO - __main__ - Step 13537: {'lr': 0.0004925419449222578, 'samples': 2599104, 'steps': 13536, 'loss/train': 2.1349470615386963} +11/06/2021 23:07:04 - INFO - __main__ - Step 13538: {'lr': 0.0004925406583297851, 'samples': 2599296, 'steps': 13537, 'loss/train': 1.8483484983444214} +11/06/2021 23:07:04 - INFO - __main__ - Step 13539: {'lr': 0.0004925393716280274, 'samples': 2599488, 'steps': 13538, 'loss/train': 1.1511164903640747} +11/06/2021 23:07:04 - INFO - __main__ - Step 13540: {'lr': 0.0004925380848169851, 'samples': 2599680, 'steps': 13539, 'loss/train': 1.4362045526504517} +11/06/2021 23:07:05 - INFO - __main__ - Step 13541: {'lr': 0.0004925367978966588, 'samples': 2599872, 'steps': 13540, 'loss/train': 2.184403419494629} +11/06/2021 23:07:05 - INFO - __main__ - Step 13542: {'lr': 0.0004925355108670493, 'samples': 2600064, 'steps': 13541, 'loss/train': 1.5568304061889648} +11/06/2021 23:07:06 - INFO - __main__ - Step 13543: {'lr': 0.0004925342237281571, 'samples': 2600256, 'steps': 13542, 'loss/train': 1.6341681480407715} +11/06/2021 23:07:06 - INFO - __main__ - Step 13544: {'lr': 0.0004925329364799825, 'samples': 2600448, 'steps': 13543, 'loss/train': 1.4727433919906616} +11/06/2021 23:07:07 - INFO - __main__ - Step 13545: {'lr': 0.0004925316491225265, 'samples': 2600640, 'steps': 13544, 'loss/train': 1.715566873550415} +11/06/2021 23:07:07 - INFO - __main__ - Step 13546: {'lr': 0.0004925303616557893, 'samples': 2600832, 'steps': 13545, 'loss/train': 1.6563913822174072} +11/06/2021 23:07:08 - INFO - __main__ - Step 13547: {'lr': 0.0004925290740797718, 'samples': 2601024, 'steps': 13546, 'loss/train': 1.9867644309997559} +11/06/2021 23:07:08 - INFO - __main__ - Step 13548: {'lr': 0.0004925277863944745, 'samples': 2601216, 'steps': 13547, 'loss/train': 2.0575523376464844} +11/06/2021 23:07:09 - INFO - __main__ - Step 13549: {'lr': 0.0004925264985998978, 'samples': 2601408, 'steps': 13548, 'loss/train': 1.7261626720428467} +11/06/2021 23:07:09 - INFO - __main__ - Step 13550: {'lr': 0.0004925252106960425, 'samples': 2601600, 'steps': 13549, 'loss/train': 1.596949577331543} +11/06/2021 23:07:10 - INFO - __main__ - Step 13551: {'lr': 0.000492523922682909, 'samples': 2601792, 'steps': 13550, 'loss/train': 1.3621716499328613} +11/06/2021 23:07:10 - INFO - __main__ - Step 13552: {'lr': 0.0004925226345604979, 'samples': 2601984, 'steps': 13551, 'loss/train': 1.458478569984436} +11/06/2021 23:07:10 - INFO - __main__ - Step 13553: {'lr': 0.0004925213463288099, 'samples': 2602176, 'steps': 13552, 'loss/train': 1.587988257408142} +11/06/2021 23:07:11 - INFO - __main__ - Step 13554: {'lr': 0.0004925200579878456, 'samples': 2602368, 'steps': 13553, 'loss/train': 1.3299733400344849} +11/06/2021 23:07:12 - INFO - __main__ - Step 13555: {'lr': 0.0004925187695376055, 'samples': 2602560, 'steps': 13554, 'loss/train': 1.4566415548324585} +11/06/2021 23:07:12 - INFO - __main__ - Step 13556: {'lr': 0.0004925174809780901, 'samples': 2602752, 'steps': 13555, 'loss/train': 1.6076452732086182} +11/06/2021 23:07:12 - INFO - __main__ - Step 13557: {'lr': 0.0004925161923093001, 'samples': 2602944, 'steps': 13556, 'loss/train': 1.5300875902175903} +11/06/2021 23:07:13 - INFO - __main__ - Step 13558: {'lr': 0.000492514903531236, 'samples': 2603136, 'steps': 13557, 'loss/train': 1.9013261795043945} +11/06/2021 23:07:14 - INFO - __main__ - Step 13559: {'lr': 0.0004925136146438986, 'samples': 2603328, 'steps': 13558, 'loss/train': 1.5588353872299194} +11/06/2021 23:07:14 - INFO - __main__ - Step 13560: {'lr': 0.0004925123256472881, 'samples': 2603520, 'steps': 13559, 'loss/train': 1.529636263847351} +11/06/2021 23:07:14 - INFO - __main__ - Step 13561: {'lr': 0.0004925110365414054, 'samples': 2603712, 'steps': 13560, 'loss/train': 1.6311484575271606} +11/06/2021 23:07:15 - INFO - __main__ - Step 13562: {'lr': 0.0004925097473262509, 'samples': 2603904, 'steps': 13561, 'loss/train': 1.773667573928833} +11/06/2021 23:07:15 - INFO - __main__ - Step 13563: {'lr': 0.0004925084580018253, 'samples': 2604096, 'steps': 13562, 'loss/train': 1.412859559059143} +11/06/2021 23:07:16 - INFO - __main__ - Step 13564: {'lr': 0.0004925071685681292, 'samples': 2604288, 'steps': 13563, 'loss/train': 2.0537023544311523} +11/06/2021 23:07:16 - INFO - __main__ - Step 13565: {'lr': 0.000492505879025163, 'samples': 2604480, 'steps': 13564, 'loss/train': 1.4484230279922485} +11/06/2021 23:07:17 - INFO - __main__ - Step 13566: {'lr': 0.0004925045893729274, 'samples': 2604672, 'steps': 13565, 'loss/train': 1.8159236907958984} +11/06/2021 23:07:17 - INFO - __main__ - Step 13567: {'lr': 0.000492503299611423, 'samples': 2604864, 'steps': 13566, 'loss/train': 1.2261930704116821} +11/06/2021 23:07:18 - INFO - __main__ - Step 13568: {'lr': 0.0004925020097406504, 'samples': 2605056, 'steps': 13567, 'loss/train': 1.8330031633377075} +11/06/2021 23:07:19 - INFO - __main__ - Step 13569: {'lr': 0.00049250071976061, 'samples': 2605248, 'steps': 13568, 'loss/train': 1.5868868827819824} +11/06/2021 23:07:19 - INFO - __main__ - Step 13570: {'lr': 0.0004924994296713026, 'samples': 2605440, 'steps': 13569, 'loss/train': 1.7566038370132446} +11/06/2021 23:07:19 - INFO - __main__ - Step 13571: {'lr': 0.0004924981394727288, 'samples': 2605632, 'steps': 13570, 'loss/train': 1.4361501932144165} +11/06/2021 23:07:20 - INFO - __main__ - Step 13572: {'lr': 0.0004924968491648889, 'samples': 2605824, 'steps': 13571, 'loss/train': 1.6027421951293945} +11/06/2021 23:07:20 - INFO - __main__ - Step 13573: {'lr': 0.0004924955587477837, 'samples': 2606016, 'steps': 13572, 'loss/train': 1.6203863620758057} +11/06/2021 23:07:21 - INFO - __main__ - Step 13574: {'lr': 0.0004924942682214138, 'samples': 2606208, 'steps': 13573, 'loss/train': 1.7938021421432495} +11/06/2021 23:07:21 - INFO - __main__ - Step 13575: {'lr': 0.0004924929775857798, 'samples': 2606400, 'steps': 13574, 'loss/train': 0.9622952938079834} +11/06/2021 23:07:22 - INFO - __main__ - Step 13576: {'lr': 0.0004924916868408821, 'samples': 2606592, 'steps': 13575, 'loss/train': 1.0422208309173584} +11/06/2021 23:07:22 - INFO - __main__ - Step 13577: {'lr': 0.0004924903959867214, 'samples': 2606784, 'steps': 13576, 'loss/train': 1.6397504806518555} +11/06/2021 23:07:22 - INFO - __main__ - Step 13578: {'lr': 0.0004924891050232984, 'samples': 2606976, 'steps': 13577, 'loss/train': 1.8606226444244385} +11/06/2021 23:07:23 - INFO - __main__ - Step 13579: {'lr': 0.0004924878139506134, 'samples': 2607168, 'steps': 13578, 'loss/train': 1.482366681098938} +11/06/2021 23:07:24 - INFO - __main__ - Step 13580: {'lr': 0.0004924865227686671, 'samples': 2607360, 'steps': 13579, 'loss/train': 1.4506975412368774} +11/06/2021 23:07:25 - INFO - __main__ - Step 13581: {'lr': 0.0004924852314774602, 'samples': 2607552, 'steps': 13580, 'loss/train': 2.16103196144104} +11/06/2021 23:07:25 - INFO - __main__ - Step 13582: {'lr': 0.0004924839400769932, 'samples': 2607744, 'steps': 13581, 'loss/train': 1.665818452835083} +11/06/2021 23:07:25 - INFO - __main__ - Step 13583: {'lr': 0.0004924826485672667, 'samples': 2607936, 'steps': 13582, 'loss/train': 0.9627843499183655} +11/06/2021 23:07:26 - INFO - __main__ - Step 13584: {'lr': 0.0004924813569482812, 'samples': 2608128, 'steps': 13583, 'loss/train': 1.1385881900787354} +11/06/2021 23:07:27 - INFO - __main__ - Step 13585: {'lr': 0.0004924800652200373, 'samples': 2608320, 'steps': 13584, 'loss/train': 1.7369372844696045} +11/06/2021 23:07:27 - INFO - __main__ - Step 13586: {'lr': 0.0004924787733825357, 'samples': 2608512, 'steps': 13585, 'loss/train': 2.386915922164917} +11/06/2021 23:07:27 - INFO - __main__ - Step 13587: {'lr': 0.0004924774814357768, 'samples': 2608704, 'steps': 13586, 'loss/train': 1.7782405614852905} +11/06/2021 23:07:28 - INFO - __main__ - Step 13588: {'lr': 0.0004924761893797615, 'samples': 2608896, 'steps': 13587, 'loss/train': 1.8888113498687744} +11/06/2021 23:07:28 - INFO - __main__ - Step 13589: {'lr': 0.00049247489721449, 'samples': 2609088, 'steps': 13588, 'loss/train': 5.811814785003662} +11/06/2021 23:07:29 - INFO - __main__ - Step 13590: {'lr': 0.0004924736049399631, 'samples': 2609280, 'steps': 13589, 'loss/train': 1.3031723499298096} +11/06/2021 23:07:29 - INFO - __main__ - Step 13591: {'lr': 0.0004924723125561813, 'samples': 2609472, 'steps': 13590, 'loss/train': 1.8062859773635864} +11/06/2021 23:07:30 - INFO - __main__ - Step 13592: {'lr': 0.0004924710200631453, 'samples': 2609664, 'steps': 13591, 'loss/train': 1.475710153579712} +11/06/2021 23:07:30 - INFO - __main__ - Step 13593: {'lr': 0.0004924697274608556, 'samples': 2609856, 'steps': 13592, 'loss/train': 1.6289951801300049} +11/06/2021 23:07:31 - INFO - __main__ - Step 13594: {'lr': 0.0004924684347493126, 'samples': 2610048, 'steps': 13593, 'loss/train': 1.741284966468811} +11/06/2021 23:07:32 - INFO - __main__ - Step 13595: {'lr': 0.0004924671419285172, 'samples': 2610240, 'steps': 13594, 'loss/train': 1.871199369430542} +11/06/2021 23:07:32 - INFO - __main__ - Step 13596: {'lr': 0.0004924658489984699, 'samples': 2610432, 'steps': 13595, 'loss/train': 1.5763531923294067} +11/06/2021 23:07:32 - INFO - __main__ - Step 13597: {'lr': 0.0004924645559591712, 'samples': 2610624, 'steps': 13596, 'loss/train': 1.8481301069259644} +11/06/2021 23:07:33 - INFO - __main__ - Step 13598: {'lr': 0.0004924632628106217, 'samples': 2610816, 'steps': 13597, 'loss/train': 1.9725139141082764} +11/06/2021 23:07:33 - INFO - __main__ - Step 13599: {'lr': 0.000492461969552822, 'samples': 2611008, 'steps': 13598, 'loss/train': 1.4551993608474731} +11/06/2021 23:07:33 - INFO - __main__ - Step 13600: {'lr': 0.0004924606761857726, 'samples': 2611200, 'steps': 13599, 'loss/train': 1.2987780570983887} +11/06/2021 23:07:34 - INFO - __main__ - Step 13601: {'lr': 0.0004924593827094744, 'samples': 2611392, 'steps': 13600, 'loss/train': 1.725089430809021} +11/06/2021 23:07:35 - INFO - __main__ - Step 13602: {'lr': 0.0004924580891239274, 'samples': 2611584, 'steps': 13601, 'loss/train': 1.9037177562713623} +11/06/2021 23:07:35 - INFO - __main__ - Step 13603: {'lr': 0.0004924567954291328, 'samples': 2611776, 'steps': 13602, 'loss/train': 1.6505497694015503} +11/06/2021 23:07:35 - INFO - __main__ - Step 13604: {'lr': 0.0004924555016250908, 'samples': 2611968, 'steps': 13603, 'loss/train': 1.9242398738861084} +11/06/2021 23:07:36 - INFO - __main__ - Step 13605: {'lr': 0.0004924542077118021, 'samples': 2612160, 'steps': 13604, 'loss/train': 1.6586657762527466} +11/06/2021 23:07:38 - INFO - __main__ - Step 13606: {'lr': 0.0004924529136892673, 'samples': 2612352, 'steps': 13605, 'loss/train': 1.6785545349121094} +11/06/2021 23:07:38 - INFO - __main__ - Step 13607: {'lr': 0.0004924516195574869, 'samples': 2612544, 'steps': 13606, 'loss/train': 0.57390958070755} +11/06/2021 23:07:39 - INFO - __main__ - Step 13608: {'lr': 0.0004924503253164614, 'samples': 2612736, 'steps': 13607, 'loss/train': 1.4627878665924072} +11/06/2021 23:07:39 - INFO - __main__ - Step 13609: {'lr': 0.0004924490309661918, 'samples': 2612928, 'steps': 13608, 'loss/train': 0.6431192755699158} +11/06/2021 23:07:39 - INFO - __main__ - Step 13610: {'lr': 0.0004924477365066783, 'samples': 2613120, 'steps': 13609, 'loss/train': 1.783947229385376} +11/06/2021 23:07:40 - INFO - __main__ - Step 13611: {'lr': 0.0004924464419379217, 'samples': 2613312, 'steps': 13610, 'loss/train': 1.6398215293884277} +11/06/2021 23:07:41 - INFO - __main__ - Step 13612: {'lr': 0.0004924451472599222, 'samples': 2613504, 'steps': 13611, 'loss/train': 0.23156870901584625} +11/06/2021 23:07:41 - INFO - __main__ - Step 13613: {'lr': 0.000492443852472681, 'samples': 2613696, 'steps': 13612, 'loss/train': 1.843045711517334} +11/06/2021 23:07:41 - INFO - __main__ - Step 13614: {'lr': 0.000492442557576198, 'samples': 2613888, 'steps': 13613, 'loss/train': 1.7973626852035522} +11/06/2021 23:07:42 - INFO - __main__ - Step 13615: {'lr': 0.0004924412625704744, 'samples': 2614080, 'steps': 13614, 'loss/train': 2.342195749282837} +11/06/2021 23:07:42 - INFO - __main__ - Step 13616: {'lr': 0.0004924399674555103, 'samples': 2614272, 'steps': 13615, 'loss/train': 1.5847399234771729} +11/06/2021 23:07:42 - INFO - __main__ - Step 13617: {'lr': 0.0004924386722313066, 'samples': 2614464, 'steps': 13616, 'loss/train': 1.906503438949585} +11/06/2021 23:07:43 - INFO - __main__ - Step 13618: {'lr': 0.0004924373768978638, 'samples': 2614656, 'steps': 13617, 'loss/train': 2.0704801082611084} +11/06/2021 23:07:44 - INFO - __main__ - Step 13619: {'lr': 0.0004924360814551825, 'samples': 2614848, 'steps': 13618, 'loss/train': 1.9433788061141968} +11/06/2021 23:07:44 - INFO - __main__ - Step 13620: {'lr': 0.0004924347859032631, 'samples': 2615040, 'steps': 13619, 'loss/train': 1.7289719581604004} +11/06/2021 23:07:44 - INFO - __main__ - Step 13621: {'lr': 0.0004924334902421065, 'samples': 2615232, 'steps': 13620, 'loss/train': 2.022456407546997} +11/06/2021 23:07:45 - INFO - __main__ - Step 13622: {'lr': 0.0004924321944717129, 'samples': 2615424, 'steps': 13621, 'loss/train': 1.9337289333343506} +11/06/2021 23:07:46 - INFO - __main__ - Step 13623: {'lr': 0.0004924308985920832, 'samples': 2615616, 'steps': 13622, 'loss/train': 2.2961039543151855} +11/06/2021 23:07:46 - INFO - __main__ - Step 13624: {'lr': 0.0004924296026032179, 'samples': 2615808, 'steps': 13623, 'loss/train': 1.2842239141464233} +11/06/2021 23:07:46 - INFO - __main__ - Step 13625: {'lr': 0.0004924283065051176, 'samples': 2616000, 'steps': 13624, 'loss/train': 1.8332487344741821} +11/06/2021 23:07:47 - INFO - __main__ - Step 13626: {'lr': 0.0004924270102977827, 'samples': 2616192, 'steps': 13625, 'loss/train': 2.1077988147735596} +11/06/2021 23:07:47 - INFO - __main__ - Step 13627: {'lr': 0.0004924257139812141, 'samples': 2616384, 'steps': 13626, 'loss/train': 1.8396973609924316} +11/06/2021 23:07:49 - INFO - __main__ - Step 13628: {'lr': 0.0004924244175554121, 'samples': 2616576, 'steps': 13627, 'loss/train': 1.9551353454589844} +11/06/2021 23:07:49 - INFO - __main__ - Step 13629: {'lr': 0.0004924231210203775, 'samples': 2616768, 'steps': 13628, 'loss/train': 1.9722517728805542} +11/06/2021 23:07:49 - INFO - __main__ - Step 13630: {'lr': 0.0004924218243761106, 'samples': 2616960, 'steps': 13629, 'loss/train': 1.3070924282073975} +11/06/2021 23:07:50 - INFO - __main__ - Step 13631: {'lr': 0.0004924205276226123, 'samples': 2617152, 'steps': 13630, 'loss/train': 1.8307408094406128} +11/06/2021 23:07:50 - INFO - __main__ - Step 13632: {'lr': 0.000492419230759883, 'samples': 2617344, 'steps': 13631, 'loss/train': 1.8106156587600708} +11/06/2021 23:07:50 - INFO - __main__ - Step 13633: {'lr': 0.0004924179337879234, 'samples': 2617536, 'steps': 13632, 'loss/train': 1.3615984916687012} +11/06/2021 23:07:51 - INFO - __main__ - Step 13634: {'lr': 0.000492416636706734, 'samples': 2617728, 'steps': 13633, 'loss/train': 1.84334397315979} +11/06/2021 23:07:52 - INFO - __main__ - Step 13635: {'lr': 0.0004924153395163153, 'samples': 2617920, 'steps': 13634, 'loss/train': 1.8057781457901} +11/06/2021 23:07:52 - INFO - __main__ - Step 13636: {'lr': 0.0004924140422166681, 'samples': 2618112, 'steps': 13635, 'loss/train': 1.1118844747543335} +11/06/2021 23:07:52 - INFO - __main__ - Step 13637: {'lr': 0.0004924127448077929, 'samples': 2618304, 'steps': 13636, 'loss/train': 1.283229112625122} +11/06/2021 23:07:53 - INFO - __main__ - Step 13638: {'lr': 0.0004924114472896902, 'samples': 2618496, 'steps': 13637, 'loss/train': 1.547655701637268} +11/06/2021 23:07:54 - INFO - __main__ - Step 13639: {'lr': 0.0004924101496623606, 'samples': 2618688, 'steps': 13638, 'loss/train': 1.6274465322494507} +11/06/2021 23:07:54 - INFO - __main__ - Step 13640: {'lr': 0.0004924088519258049, 'samples': 2618880, 'steps': 13639, 'loss/train': 1.567894697189331} +11/06/2021 23:07:55 - INFO - __main__ - Step 13641: {'lr': 0.0004924075540800233, 'samples': 2619072, 'steps': 13640, 'loss/train': 1.5722965002059937} +11/06/2021 23:07:55 - INFO - __main__ - Step 13642: {'lr': 0.0004924062561250167, 'samples': 2619264, 'steps': 13641, 'loss/train': 1.4436631202697754} +11/06/2021 23:07:55 - INFO - __main__ - Step 13643: {'lr': 0.0004924049580607855, 'samples': 2619456, 'steps': 13642, 'loss/train': 1.4802452325820923} +11/06/2021 23:07:56 - INFO - __main__ - Step 13644: {'lr': 0.0004924036598873305, 'samples': 2619648, 'steps': 13643, 'loss/train': 1.4207649230957031} +11/06/2021 23:07:57 - INFO - __main__ - Step 13645: {'lr': 0.0004924023616046521, 'samples': 2619840, 'steps': 13644, 'loss/train': 0.14849276840686798} +11/06/2021 23:07:57 - INFO - __main__ - Step 13646: {'lr': 0.000492401063212751, 'samples': 2620032, 'steps': 13645, 'loss/train': 1.5605554580688477} +11/06/2021 23:07:57 - INFO - __main__ - Step 13647: {'lr': 0.0004923997647116276, 'samples': 2620224, 'steps': 13646, 'loss/train': 0.61855548620224} +11/06/2021 23:07:58 - INFO - __main__ - Step 13648: {'lr': 0.0004923984661012827, 'samples': 2620416, 'steps': 13647, 'loss/train': 1.0472122430801392} +11/06/2021 23:07:58 - INFO - __main__ - Step 13649: {'lr': 0.0004923971673817167, 'samples': 2620608, 'steps': 13648, 'loss/train': 2.2823336124420166} +11/06/2021 23:07:59 - INFO - __main__ - Step 13650: {'lr': 0.0004923958685529303, 'samples': 2620800, 'steps': 13649, 'loss/train': 1.8961249589920044} +11/06/2021 23:07:59 - INFO - __main__ - Step 13651: {'lr': 0.0004923945696149241, 'samples': 2620992, 'steps': 13650, 'loss/train': 1.9037821292877197} +11/06/2021 23:08:00 - INFO - __main__ - Step 13652: {'lr': 0.0004923932705676986, 'samples': 2621184, 'steps': 13651, 'loss/train': 1.549149990081787} +11/06/2021 23:08:00 - INFO - __main__ - Step 13653: {'lr': 0.0004923919714112545, 'samples': 2621376, 'steps': 13652, 'loss/train': 1.5010502338409424} +11/06/2021 23:08:01 - INFO - __main__ - Step 13654: {'lr': 0.0004923906721455922, 'samples': 2621568, 'steps': 13653, 'loss/train': 1.2696095705032349} +11/06/2021 23:08:01 - INFO - __main__ - Step 13655: {'lr': 0.0004923893727707125, 'samples': 2621760, 'steps': 13654, 'loss/train': 2.0763657093048096} +11/06/2021 23:08:02 - INFO - __main__ - Step 13656: {'lr': 0.0004923880732866159, 'samples': 2621952, 'steps': 13655, 'loss/train': 1.3228414058685303} +11/06/2021 23:08:02 - INFO - __main__ - Step 13657: {'lr': 0.0004923867736933029, 'samples': 2622144, 'steps': 13656, 'loss/train': 1.621604323387146} +11/06/2021 23:08:02 - INFO - __main__ - Step 13658: {'lr': 0.0004923854739907743, 'samples': 2622336, 'steps': 13657, 'loss/train': 1.2240080833435059} +11/06/2021 23:08:03 - INFO - __main__ - Step 13659: {'lr': 0.0004923841741790304, 'samples': 2622528, 'steps': 13658, 'loss/train': 1.7025880813598633} +11/06/2021 23:08:04 - INFO - __main__ - Step 13660: {'lr': 0.0004923828742580719, 'samples': 2622720, 'steps': 13659, 'loss/train': 0.8166983723640442} +11/06/2021 23:08:04 - INFO - __main__ - Step 13661: {'lr': 0.0004923815742278996, 'samples': 2622912, 'steps': 13660, 'loss/train': 1.8481582403182983} +11/06/2021 23:08:05 - INFO - __main__ - Step 13662: {'lr': 0.0004923802740885139, 'samples': 2623104, 'steps': 13661, 'loss/train': 1.9549199342727661} +11/06/2021 23:08:05 - INFO - __main__ - Step 13663: {'lr': 0.0004923789738399152, 'samples': 2623296, 'steps': 13662, 'loss/train': 1.5047688484191895} +11/06/2021 23:08:05 - INFO - __main__ - Step 13664: {'lr': 0.0004923776734821044, 'samples': 2623488, 'steps': 13663, 'loss/train': 1.784568190574646} +11/06/2021 23:08:07 - INFO - __main__ - Step 13665: {'lr': 0.0004923763730150819, 'samples': 2623680, 'steps': 13664, 'loss/train': 1.6027264595031738} +11/06/2021 23:08:07 - INFO - __main__ - Step 13666: {'lr': 0.0004923750724388483, 'samples': 2623872, 'steps': 13665, 'loss/train': 1.826322078704834} +11/06/2021 23:08:07 - INFO - __main__ - Step 13667: {'lr': 0.0004923737717534044, 'samples': 2624064, 'steps': 13666, 'loss/train': 1.9176068305969238} +11/06/2021 23:08:08 - INFO - __main__ - Step 13668: {'lr': 0.0004923724709587504, 'samples': 2624256, 'steps': 13667, 'loss/train': 2.2338030338287354} +11/06/2021 23:08:08 - INFO - __main__ - Step 13669: {'lr': 0.0004923711700548873, 'samples': 2624448, 'steps': 13668, 'loss/train': 1.8430683612823486} +11/06/2021 23:08:09 - INFO - __main__ - Step 13670: {'lr': 0.0004923698690418154, 'samples': 2624640, 'steps': 13669, 'loss/train': 0.9396169781684875} +11/06/2021 23:08:09 - INFO - __main__ - Step 13671: {'lr': 0.0004923685679195355, 'samples': 2624832, 'steps': 13670, 'loss/train': 1.6337071657180786} +11/06/2021 23:08:10 - INFO - __main__ - Step 13672: {'lr': 0.0004923672666880479, 'samples': 2625024, 'steps': 13671, 'loss/train': 1.3676971197128296} +11/06/2021 23:08:10 - INFO - __main__ - Step 13673: {'lr': 0.0004923659653473533, 'samples': 2625216, 'steps': 13672, 'loss/train': 1.6104556322097778} +11/06/2021 23:08:10 - INFO - __main__ - Step 13674: {'lr': 0.0004923646638974524, 'samples': 2625408, 'steps': 13673, 'loss/train': 1.3942358493804932} +11/06/2021 23:08:11 - INFO - __main__ - Step 13675: {'lr': 0.0004923633623383459, 'samples': 2625600, 'steps': 13674, 'loss/train': 1.8581507205963135} +11/06/2021 23:08:12 - INFO - __main__ - Step 13676: {'lr': 0.0004923620606700341, 'samples': 2625792, 'steps': 13675, 'loss/train': 1.0747668743133545} +11/06/2021 23:08:12 - INFO - __main__ - Step 13677: {'lr': 0.0004923607588925177, 'samples': 2625984, 'steps': 13676, 'loss/train': 1.7954381704330444} +11/06/2021 23:08:13 - INFO - __main__ - Step 13678: {'lr': 0.0004923594570057972, 'samples': 2626176, 'steps': 13677, 'loss/train': 1.8228819370269775} +11/06/2021 23:08:13 - INFO - __main__ - Step 13679: {'lr': 0.0004923581550098733, 'samples': 2626368, 'steps': 13678, 'loss/train': 1.6954731941223145} +11/06/2021 23:08:13 - INFO - __main__ - Step 13680: {'lr': 0.0004923568529047466, 'samples': 2626560, 'steps': 13679, 'loss/train': 1.7315030097961426} +11/06/2021 23:08:14 - INFO - __main__ - Step 13681: {'lr': 0.0004923555506904176, 'samples': 2626752, 'steps': 13680, 'loss/train': 1.701892614364624} +11/06/2021 23:08:15 - INFO - __main__ - Step 13682: {'lr': 0.0004923542483668869, 'samples': 2626944, 'steps': 13681, 'loss/train': 1.860314130783081} +11/06/2021 23:08:15 - INFO - __main__ - Step 13683: {'lr': 0.0004923529459341553, 'samples': 2627136, 'steps': 13682, 'loss/train': 1.5771002769470215} +11/06/2021 23:08:15 - INFO - __main__ - Step 13684: {'lr': 0.000492351643392223, 'samples': 2627328, 'steps': 13683, 'loss/train': 2.214824914932251} +11/06/2021 23:08:16 - INFO - __main__ - Step 13685: {'lr': 0.0004923503407410908, 'samples': 2627520, 'steps': 13684, 'loss/train': 1.6392228603363037} +11/06/2021 23:08:17 - INFO - __main__ - Step 13686: {'lr': 0.0004923490379807594, 'samples': 2627712, 'steps': 13685, 'loss/train': 1.5940680503845215} +11/06/2021 23:08:17 - INFO - __main__ - Step 13687: {'lr': 0.0004923477351112291, 'samples': 2627904, 'steps': 13686, 'loss/train': 1.3699396848678589} +11/06/2021 23:08:17 - INFO - __main__ - Step 13688: {'lr': 0.0004923464321325008, 'samples': 2628096, 'steps': 13687, 'loss/train': 2.2057156562805176} +11/06/2021 23:08:18 - INFO - __main__ - Step 13689: {'lr': 0.0004923451290445749, 'samples': 2628288, 'steps': 13688, 'loss/train': 1.5960655212402344} +11/06/2021 23:08:18 - INFO - __main__ - Step 13690: {'lr': 0.000492343825847452, 'samples': 2628480, 'steps': 13689, 'loss/train': 2.2023274898529053} +11/06/2021 23:08:19 - INFO - __main__ - Step 13691: {'lr': 0.0004923425225411328, 'samples': 2628672, 'steps': 13690, 'loss/train': 1.8006644248962402} +11/06/2021 23:08:19 - INFO - __main__ - Step 13692: {'lr': 0.0004923412191256176, 'samples': 2628864, 'steps': 13691, 'loss/train': 1.6855508089065552} +11/06/2021 23:08:20 - INFO - __main__ - Step 13693: {'lr': 0.0004923399156009073, 'samples': 2629056, 'steps': 13692, 'loss/train': 1.91086745262146} +11/06/2021 23:08:20 - INFO - __main__ - Step 13694: {'lr': 0.0004923386119670024, 'samples': 2629248, 'steps': 13693, 'loss/train': 2.243964910507202} +11/06/2021 23:08:20 - INFO - __main__ - Step 13695: {'lr': 0.0004923373082239035, 'samples': 2629440, 'steps': 13694, 'loss/train': 1.8091576099395752} +11/06/2021 23:08:21 - INFO - __main__ - Step 13696: {'lr': 0.000492336004371611, 'samples': 2629632, 'steps': 13695, 'loss/train': 1.891566276550293} +11/06/2021 23:08:22 - INFO - __main__ - Step 13697: {'lr': 0.0004923347004101257, 'samples': 2629824, 'steps': 13696, 'loss/train': 1.8870787620544434} +11/06/2021 23:08:22 - INFO - __main__ - Step 13698: {'lr': 0.0004923333963394482, 'samples': 2630016, 'steps': 13697, 'loss/train': 1.609986424446106} +11/06/2021 23:08:22 - INFO - __main__ - Step 13699: {'lr': 0.000492332092159579, 'samples': 2630208, 'steps': 13698, 'loss/train': 1.5685456991195679} +11/06/2021 23:08:23 - INFO - __main__ - Step 13700: {'lr': 0.0004923307878705186, 'samples': 2630400, 'steps': 13699, 'loss/train': 1.4887804985046387} +11/06/2021 23:08:24 - INFO - __main__ - Step 13701: {'lr': 0.0004923294834722678, 'samples': 2630592, 'steps': 13700, 'loss/train': 1.6135252714157104} +11/06/2021 23:08:24 - INFO - __main__ - Step 13702: {'lr': 0.000492328178964827, 'samples': 2630784, 'steps': 13701, 'loss/train': 1.7054436206817627} +11/06/2021 23:08:25 - INFO - __main__ - Step 13703: {'lr': 0.0004923268743481969, 'samples': 2630976, 'steps': 13702, 'loss/train': 1.3338326215744019} +11/06/2021 23:08:25 - INFO - __main__ - Step 13704: {'lr': 0.000492325569622378, 'samples': 2631168, 'steps': 13703, 'loss/train': 1.5167887210845947} +11/06/2021 23:08:25 - INFO - __main__ - Step 13705: {'lr': 0.0004923242647873709, 'samples': 2631360, 'steps': 13704, 'loss/train': 1.7764374017715454} +11/06/2021 23:08:27 - INFO - __main__ - Step 13706: {'lr': 0.0004923229598431763, 'samples': 2631552, 'steps': 13705, 'loss/train': 1.981156349182129} +11/06/2021 23:08:27 - INFO - __main__ - Step 13707: {'lr': 0.0004923216547897948, 'samples': 2631744, 'steps': 13706, 'loss/train': 1.6128805875778198} +11/06/2021 23:08:27 - INFO - __main__ - Step 13708: {'lr': 0.0004923203496272267, 'samples': 2631936, 'steps': 13707, 'loss/train': 1.7675461769104004} +11/06/2021 23:08:28 - INFO - __main__ - Step 13709: {'lr': 0.0004923190443554729, 'samples': 2632128, 'steps': 13708, 'loss/train': 1.66963529586792} +11/06/2021 23:08:28 - INFO - __main__ - Step 13710: {'lr': 0.0004923177389745339, 'samples': 2632320, 'steps': 13709, 'loss/train': 0.4389937222003937} +11/06/2021 23:08:29 - INFO - __main__ - Step 13711: {'lr': 0.0004923164334844103, 'samples': 2632512, 'steps': 13710, 'loss/train': 1.7726091146469116} +11/06/2021 23:08:29 - INFO - __main__ - Step 13712: {'lr': 0.0004923151278851025, 'samples': 2632704, 'steps': 13711, 'loss/train': 0.9735046029090881} +11/06/2021 23:08:30 - INFO - __main__ - Step 13713: {'lr': 0.0004923138221766114, 'samples': 2632896, 'steps': 13712, 'loss/train': 1.4027715921401978} +11/06/2021 23:08:30 - INFO - __main__ - Step 13714: {'lr': 0.0004923125163589373, 'samples': 2633088, 'steps': 13713, 'loss/train': 1.875281572341919} +11/06/2021 23:08:30 - INFO - __main__ - Step 13715: {'lr': 0.0004923112104320811, 'samples': 2633280, 'steps': 13714, 'loss/train': 1.6900665760040283} +11/06/2021 23:08:32 - INFO - __main__ - Step 13716: {'lr': 0.000492309904396043, 'samples': 2633472, 'steps': 13715, 'loss/train': 1.1452865600585938} +11/06/2021 23:08:32 - INFO - __main__ - Step 13717: {'lr': 0.0004923085982508239, 'samples': 2633664, 'steps': 13716, 'loss/train': 1.9100697040557861} +11/06/2021 23:08:32 - INFO - __main__ - Step 13718: {'lr': 0.0004923072919964243, 'samples': 2633856, 'steps': 13717, 'loss/train': 4.524446964263916} +11/06/2021 23:08:33 - INFO - __main__ - Step 13719: {'lr': 0.0004923059856328447, 'samples': 2634048, 'steps': 13718, 'loss/train': 1.5310945510864258} +11/06/2021 23:08:33 - INFO - __main__ - Step 13720: {'lr': 0.0004923046791600859, 'samples': 2634240, 'steps': 13719, 'loss/train': 1.5483694076538086} +11/06/2021 23:08:34 - INFO - __main__ - Step 13721: {'lr': 0.0004923033725781482, 'samples': 2634432, 'steps': 13720, 'loss/train': 1.6037310361862183} +11/06/2021 23:08:34 - INFO - __main__ - Step 13722: {'lr': 0.0004923020658870324, 'samples': 2634624, 'steps': 13721, 'loss/train': 1.3916311264038086} +11/06/2021 23:08:35 - INFO - __main__ - Step 13723: {'lr': 0.000492300759086739, 'samples': 2634816, 'steps': 13722, 'loss/train': 0.19058111310005188} +11/06/2021 23:08:35 - INFO - __main__ - Step 13724: {'lr': 0.0004922994521772687, 'samples': 2635008, 'steps': 13723, 'loss/train': 1.856695532798767} +11/06/2021 23:08:35 - INFO - __main__ - Step 13725: {'lr': 0.000492298145158622, 'samples': 2635200, 'steps': 13724, 'loss/train': 1.6110961437225342} +11/06/2021 23:08:36 - INFO - __main__ - Step 13726: {'lr': 0.0004922968380307994, 'samples': 2635392, 'steps': 13725, 'loss/train': 2.1884765625} +11/06/2021 23:08:37 - INFO - __main__ - Step 13727: {'lr': 0.0004922955307938016, 'samples': 2635584, 'steps': 13726, 'loss/train': 1.4792718887329102} +11/06/2021 23:08:37 - INFO - __main__ - Step 13728: {'lr': 0.0004922942234476292, 'samples': 2635776, 'steps': 13727, 'loss/train': 0.9615477323532104} +11/06/2021 23:08:38 - INFO - __main__ - Step 13729: {'lr': 0.0004922929159922828, 'samples': 2635968, 'steps': 13728, 'loss/train': 1.467282772064209} +11/06/2021 23:08:38 - INFO - __main__ - Step 13730: {'lr': 0.0004922916084277629, 'samples': 2636160, 'steps': 13729, 'loss/train': 1.4172507524490356} +11/06/2021 23:08:38 - INFO - __main__ - Step 13731: {'lr': 0.0004922903007540701, 'samples': 2636352, 'steps': 13730, 'loss/train': 1.9334453344345093} +11/06/2021 23:08:40 - INFO - __main__ - Step 13732: {'lr': 0.0004922889929712051, 'samples': 2636544, 'steps': 13731, 'loss/train': 1.7975131273269653} +11/06/2021 23:08:40 - INFO - __main__ - Step 13733: {'lr': 0.0004922876850791684, 'samples': 2636736, 'steps': 13732, 'loss/train': 1.5812453031539917} +11/06/2021 23:08:40 - INFO - __main__ - Step 13734: {'lr': 0.0004922863770779606, 'samples': 2636928, 'steps': 13733, 'loss/train': 1.761626124382019} +11/06/2021 23:08:41 - INFO - __main__ - Step 13735: {'lr': 0.0004922850689675823, 'samples': 2637120, 'steps': 13734, 'loss/train': 0.9880645275115967} +11/06/2021 23:08:41 - INFO - __main__ - Step 13736: {'lr': 0.0004922837607480341, 'samples': 2637312, 'steps': 13735, 'loss/train': 1.812021255493164} +11/06/2021 23:08:41 - INFO - __main__ - Step 13737: {'lr': 0.0004922824524193166, 'samples': 2637504, 'steps': 13736, 'loss/train': 1.655940055847168} +11/06/2021 23:08:42 - INFO - __main__ - Step 13738: {'lr': 0.0004922811439814303, 'samples': 2637696, 'steps': 13737, 'loss/train': 3.0965065956115723} +11/06/2021 23:08:43 - INFO - __main__ - Step 13739: {'lr': 0.0004922798354343758, 'samples': 2637888, 'steps': 13738, 'loss/train': 1.1980981826782227} +11/06/2021 23:08:43 - INFO - __main__ - Step 13740: {'lr': 0.0004922785267781539, 'samples': 2638080, 'steps': 13739, 'loss/train': 1.4556937217712402} +11/06/2021 23:08:43 - INFO - __main__ - Step 13741: {'lr': 0.000492277218012765, 'samples': 2638272, 'steps': 13740, 'loss/train': 1.6142842769622803} +11/06/2021 23:08:44 - INFO - __main__ - Step 13742: {'lr': 0.0004922759091382097, 'samples': 2638464, 'steps': 13741, 'loss/train': 2.2603096961975098} +11/06/2021 23:08:45 - INFO - __main__ - Step 13743: {'lr': 0.0004922746001544885, 'samples': 2638656, 'steps': 13742, 'loss/train': 1.3596349954605103} +11/06/2021 23:08:45 - INFO - __main__ - Step 13744: {'lr': 0.0004922732910616023, 'samples': 2638848, 'steps': 13743, 'loss/train': 1.9842960834503174} +11/06/2021 23:08:46 - INFO - __main__ - Step 13745: {'lr': 0.0004922719818595514, 'samples': 2639040, 'steps': 13744, 'loss/train': 2.0623526573181152} +11/06/2021 23:08:46 - INFO - __main__ - Step 13746: {'lr': 0.0004922706725483364, 'samples': 2639232, 'steps': 13745, 'loss/train': 1.9149062633514404} +11/06/2021 23:08:46 - INFO - __main__ - Step 13747: {'lr': 0.0004922693631279581, 'samples': 2639424, 'steps': 13746, 'loss/train': 2.0381317138671875} +11/06/2021 23:08:47 - INFO - __main__ - Step 13748: {'lr': 0.000492268053598417, 'samples': 2639616, 'steps': 13747, 'loss/train': 2.627610445022583} +11/06/2021 23:08:48 - INFO - __main__ - Step 13749: {'lr': 0.0004922667439597136, 'samples': 2639808, 'steps': 13748, 'loss/train': 1.306639552116394} +11/06/2021 23:08:48 - INFO - __main__ - Step 13750: {'lr': 0.0004922654342118484, 'samples': 2640000, 'steps': 13749, 'loss/train': 1.3434464931488037} +11/06/2021 23:08:48 - INFO - __main__ - Step 13751: {'lr': 0.0004922641243548223, 'samples': 2640192, 'steps': 13750, 'loss/train': 2.0326554775238037} +11/06/2021 23:08:49 - INFO - __main__ - Step 13752: {'lr': 0.0004922628143886358, 'samples': 2640384, 'steps': 13751, 'loss/train': 2.049717903137207} +11/06/2021 23:08:49 - INFO - __main__ - Step 13753: {'lr': 0.0004922615043132892, 'samples': 2640576, 'steps': 13752, 'loss/train': 1.6888577938079834} +11/06/2021 23:08:50 - INFO - __main__ - Step 13754: {'lr': 0.0004922601941287835, 'samples': 2640768, 'steps': 13753, 'loss/train': 0.9408217668533325} +11/06/2021 23:08:50 - INFO - __main__ - Step 13755: {'lr': 0.0004922588838351189, 'samples': 2640960, 'steps': 13754, 'loss/train': 1.6507468223571777} +11/06/2021 23:08:51 - INFO - __main__ - Step 13756: {'lr': 0.0004922575734322963, 'samples': 2641152, 'steps': 13755, 'loss/train': 1.7679812908172607} +11/06/2021 23:08:51 - INFO - __main__ - Step 13757: {'lr': 0.0004922562629203161, 'samples': 2641344, 'steps': 13756, 'loss/train': 1.271485447883606} +11/06/2021 23:08:51 - INFO - __main__ - Step 13758: {'lr': 0.0004922549522991791, 'samples': 2641536, 'steps': 13757, 'loss/train': 1.955517053604126} +11/06/2021 23:08:53 - INFO - __main__ - Step 13759: {'lr': 0.0004922536415688856, 'samples': 2641728, 'steps': 13758, 'loss/train': 2.06683349609375} +11/06/2021 23:08:53 - INFO - __main__ - Step 13760: {'lr': 0.0004922523307294364, 'samples': 2641920, 'steps': 13759, 'loss/train': 1.354589581489563} +11/06/2021 23:08:53 - INFO - __main__ - Step 13761: {'lr': 0.0004922510197808321, 'samples': 2642112, 'steps': 13760, 'loss/train': 1.9096133708953857} +11/06/2021 23:08:54 - INFO - __main__ - Step 13762: {'lr': 0.0004922497087230732, 'samples': 2642304, 'steps': 13761, 'loss/train': 1.9483925104141235} +11/06/2021 23:08:54 - INFO - __main__ - Step 13763: {'lr': 0.0004922483975561603, 'samples': 2642496, 'steps': 13762, 'loss/train': 2.073777437210083} +11/06/2021 23:08:55 - INFO - __main__ - Step 13764: {'lr': 0.000492247086280094, 'samples': 2642688, 'steps': 13763, 'loss/train': 1.6551817655563354} +11/06/2021 23:08:55 - INFO - __main__ - Step 13765: {'lr': 0.0004922457748948749, 'samples': 2642880, 'steps': 13764, 'loss/train': 1.7662451267242432} +11/06/2021 23:08:56 - INFO - __main__ - Step 13766: {'lr': 0.0004922444634005037, 'samples': 2643072, 'steps': 13765, 'loss/train': 1.595479965209961} +11/06/2021 23:08:56 - INFO - __main__ - Step 13767: {'lr': 0.0004922431517969808, 'samples': 2643264, 'steps': 13766, 'loss/train': 1.6051268577575684} +11/06/2021 23:08:57 - INFO - __main__ - Step 13768: {'lr': 0.0004922418400843068, 'samples': 2643456, 'steps': 13767, 'loss/train': 0.942782461643219} +11/06/2021 23:08:58 - INFO - __main__ - Step 13769: {'lr': 0.0004922405282624825, 'samples': 2643648, 'steps': 13768, 'loss/train': 0.8302810788154602} +11/06/2021 23:08:58 - INFO - __main__ - Step 13770: {'lr': 0.0004922392163315083, 'samples': 2643840, 'steps': 13769, 'loss/train': 2.0029447078704834} +11/06/2021 23:08:58 - INFO - __main__ - Step 13771: {'lr': 0.0004922379042913848, 'samples': 2644032, 'steps': 13770, 'loss/train': 1.7818113565444946} +11/06/2021 23:08:59 - INFO - __main__ - Step 13772: {'lr': 0.0004922365921421126, 'samples': 2644224, 'steps': 13771, 'loss/train': 2.0600786209106445} +11/06/2021 23:08:59 - INFO - __main__ - Step 13773: {'lr': 0.0004922352798836924, 'samples': 2644416, 'steps': 13772, 'loss/train': 2.0496914386749268} +11/06/2021 23:09:00 - INFO - __main__ - Step 13774: {'lr': 0.0004922339675161248, 'samples': 2644608, 'steps': 13773, 'loss/train': 1.9038617610931396} +11/06/2021 23:09:00 - INFO - __main__ - Step 13775: {'lr': 0.0004922326550394102, 'samples': 2644800, 'steps': 13774, 'loss/train': 1.3252359628677368} +11/06/2021 23:09:01 - INFO - __main__ - Step 13776: {'lr': 0.0004922313424535494, 'samples': 2644992, 'steps': 13775, 'loss/train': 1.8318666219711304} +11/06/2021 23:09:01 - INFO - __main__ - Step 13777: {'lr': 0.0004922300297585428, 'samples': 2645184, 'steps': 13776, 'loss/train': 2.127047061920166} +11/06/2021 23:09:01 - INFO - __main__ - Step 13778: {'lr': 0.0004922287169543911, 'samples': 2645376, 'steps': 13777, 'loss/train': 1.2675795555114746} +11/06/2021 23:09:02 - INFO - __main__ - Step 13779: {'lr': 0.0004922274040410949, 'samples': 2645568, 'steps': 13778, 'loss/train': 1.7878961563110352} +11/06/2021 23:09:03 - INFO - __main__ - Step 13780: {'lr': 0.0004922260910186548, 'samples': 2645760, 'steps': 13779, 'loss/train': 1.97649085521698} +11/06/2021 23:09:03 - INFO - __main__ - Step 13781: {'lr': 0.0004922247778870714, 'samples': 2645952, 'steps': 13780, 'loss/train': 1.6250098943710327} +11/06/2021 23:09:04 - INFO - __main__ - Step 13782: {'lr': 0.0004922234646463451, 'samples': 2646144, 'steps': 13781, 'loss/train': 1.9466784000396729} +11/06/2021 23:09:04 - INFO - __main__ - Step 13783: {'lr': 0.0004922221512964767, 'samples': 2646336, 'steps': 13782, 'loss/train': 1.1106783151626587} +11/06/2021 23:09:04 - INFO - __main__ - Step 13784: {'lr': 0.0004922208378374668, 'samples': 2646528, 'steps': 13783, 'loss/train': 2.0252909660339355} +11/06/2021 23:09:05 - INFO - __main__ - Step 13785: {'lr': 0.0004922195242693159, 'samples': 2646720, 'steps': 13784, 'loss/train': 1.6497094631195068} +11/06/2021 23:09:06 - INFO - __main__ - Step 13786: {'lr': 0.0004922182105920246, 'samples': 2646912, 'steps': 13785, 'loss/train': 1.4474611282348633} +11/06/2021 23:09:06 - INFO - __main__ - Step 13787: {'lr': 0.0004922168968055935, 'samples': 2647104, 'steps': 13786, 'loss/train': 2.291621446609497} +11/06/2021 23:09:06 - INFO - __main__ - Step 13788: {'lr': 0.0004922155829100233, 'samples': 2647296, 'steps': 13787, 'loss/train': 2.148526668548584} +11/06/2021 23:09:07 - INFO - __main__ - Step 13789: {'lr': 0.0004922142689053144, 'samples': 2647488, 'steps': 13788, 'loss/train': 1.9192496538162231} +11/06/2021 23:09:08 - INFO - __main__ - Step 13790: {'lr': 0.0004922129547914675, 'samples': 2647680, 'steps': 13789, 'loss/train': 2.097891330718994} +11/06/2021 23:09:08 - INFO - __main__ - Step 13791: {'lr': 0.0004922116405684832, 'samples': 2647872, 'steps': 13790, 'loss/train': 1.7721515893936157} +11/06/2021 23:09:08 - INFO - __main__ - Step 13792: {'lr': 0.0004922103262363621, 'samples': 2648064, 'steps': 13791, 'loss/train': 1.5414934158325195} +11/06/2021 23:09:09 - INFO - __main__ - Step 13793: {'lr': 0.0004922090117951047, 'samples': 2648256, 'steps': 13792, 'loss/train': 2.323873519897461} +11/06/2021 23:09:09 - INFO - __main__ - Step 13794: {'lr': 0.0004922076972447117, 'samples': 2648448, 'steps': 13793, 'loss/train': 1.157942533493042} +11/06/2021 23:09:10 - INFO - __main__ - Step 13795: {'lr': 0.0004922063825851836, 'samples': 2648640, 'steps': 13794, 'loss/train': 1.609661340713501} +11/06/2021 23:09:10 - INFO - __main__ - Step 13796: {'lr': 0.0004922050678165211, 'samples': 2648832, 'steps': 13795, 'loss/train': 0.9388356804847717} +11/06/2021 23:09:11 - INFO - __main__ - Step 13797: {'lr': 0.0004922037529387247, 'samples': 2649024, 'steps': 13796, 'loss/train': 1.7672147750854492} +11/06/2021 23:09:11 - INFO - __main__ - Step 13798: {'lr': 0.000492202437951795, 'samples': 2649216, 'steps': 13797, 'loss/train': 1.639959454536438} +11/06/2021 23:09:11 - INFO - __main__ - Step 13799: {'lr': 0.0004922011228557327, 'samples': 2649408, 'steps': 13798, 'loss/train': 1.4303568601608276} +11/06/2021 23:09:13 - INFO - __main__ - Step 13800: {'lr': 0.0004921998076505383, 'samples': 2649600, 'steps': 13799, 'loss/train': 1.8134762048721313} +11/06/2021 23:09:13 - INFO - __main__ - Step 13801: {'lr': 0.0004921984923362124, 'samples': 2649792, 'steps': 13800, 'loss/train': 1.5940922498703003} +11/06/2021 23:09:13 - INFO - __main__ - Step 13802: {'lr': 0.0004921971769127555, 'samples': 2649984, 'steps': 13801, 'loss/train': 1.1051990985870361} +11/06/2021 23:09:14 - INFO - __main__ - Step 13803: {'lr': 0.0004921958613801683, 'samples': 2650176, 'steps': 13802, 'loss/train': 1.5847387313842773} +11/06/2021 23:09:14 - INFO - __main__ - Step 13804: {'lr': 0.0004921945457384516, 'samples': 2650368, 'steps': 13803, 'loss/train': 1.840270757675171} +11/06/2021 23:09:15 - INFO - __main__ - Step 13805: {'lr': 0.0004921932299876055, 'samples': 2650560, 'steps': 13804, 'loss/train': 1.712327241897583} +11/06/2021 23:09:15 - INFO - __main__ - Step 13806: {'lr': 0.000492191914127631, 'samples': 2650752, 'steps': 13805, 'loss/train': 2.4084267616271973} +11/06/2021 23:09:16 - INFO - __main__ - Step 13807: {'lr': 0.0004921905981585286, 'samples': 2650944, 'steps': 13806, 'loss/train': 1.3894824981689453} +11/06/2021 23:09:16 - INFO - __main__ - Step 13808: {'lr': 0.0004921892820802988, 'samples': 2651136, 'steps': 13807, 'loss/train': 1.7391257286071777} +11/06/2021 23:09:16 - INFO - __main__ - Step 13809: {'lr': 0.0004921879658929422, 'samples': 2651328, 'steps': 13808, 'loss/train': 4.748656272888184} +11/06/2021 23:09:17 - INFO - __main__ - Step 13810: {'lr': 0.0004921866495964594, 'samples': 2651520, 'steps': 13809, 'loss/train': 1.1638247966766357} +11/06/2021 23:09:18 - INFO - __main__ - Step 13811: {'lr': 0.0004921853331908512, 'samples': 2651712, 'steps': 13810, 'loss/train': 1.9072991609573364} +11/06/2021 23:09:18 - INFO - __main__ - Step 13812: {'lr': 0.000492184016676118, 'samples': 2651904, 'steps': 13811, 'loss/train': 2.309782028198242} +11/06/2021 23:09:18 - INFO - __main__ - Step 13813: {'lr': 0.0004921827000522603, 'samples': 2652096, 'steps': 13812, 'loss/train': 1.5911425352096558} +11/06/2021 23:09:19 - INFO - __main__ - Step 13814: {'lr': 0.0004921813833192788, 'samples': 2652288, 'steps': 13813, 'loss/train': 1.9693739414215088} +11/06/2021 23:09:19 - INFO - __main__ - Step 13815: {'lr': 0.0004921800664771743, 'samples': 2652480, 'steps': 13814, 'loss/train': 1.7779452800750732} +11/06/2021 23:09:20 - INFO - __main__ - Step 13816: {'lr': 0.0004921787495259471, 'samples': 2652672, 'steps': 13815, 'loss/train': 1.5039100646972656} +11/06/2021 23:09:21 - INFO - __main__ - Step 13817: {'lr': 0.0004921774324655978, 'samples': 2652864, 'steps': 13816, 'loss/train': 1.054052472114563} +11/06/2021 23:09:21 - INFO - __main__ - Step 13818: {'lr': 0.0004921761152961271, 'samples': 2653056, 'steps': 13817, 'loss/train': 2.0499536991119385} +11/06/2021 23:09:21 - INFO - __main__ - Step 13819: {'lr': 0.0004921747980175357, 'samples': 2653248, 'steps': 13818, 'loss/train': 1.8573100566864014} +11/06/2021 23:09:22 - INFO - __main__ - Step 13820: {'lr': 0.0004921734806298241, 'samples': 2653440, 'steps': 13819, 'loss/train': 1.531470775604248} +11/06/2021 23:09:23 - INFO - __main__ - Step 13821: {'lr': 0.0004921721631329927, 'samples': 2653632, 'steps': 13820, 'loss/train': 3.0055086612701416} +11/06/2021 23:09:23 - INFO - __main__ - Step 13822: {'lr': 0.0004921708455270424, 'samples': 2653824, 'steps': 13821, 'loss/train': 1.5940738916397095} +11/06/2021 23:09:23 - INFO - __main__ - Step 13823: {'lr': 0.0004921695278119736, 'samples': 2654016, 'steps': 13822, 'loss/train': 2.001136541366577} +11/06/2021 23:09:24 - INFO - __main__ - Step 13824: {'lr': 0.0004921682099877869, 'samples': 2654208, 'steps': 13823, 'loss/train': 1.7149298191070557} +11/06/2021 23:09:24 - INFO - __main__ - Step 13825: {'lr': 0.000492166892054483, 'samples': 2654400, 'steps': 13824, 'loss/train': 1.6777122020721436} +11/06/2021 23:09:25 - INFO - __main__ - Step 13826: {'lr': 0.0004921655740120623, 'samples': 2654592, 'steps': 13825, 'loss/train': 1.5764762163162231} +11/06/2021 23:09:25 - INFO - __main__ - Step 13827: {'lr': 0.0004921642558605257, 'samples': 2654784, 'steps': 13826, 'loss/train': 1.0914108753204346} +11/06/2021 23:09:26 - INFO - __main__ - Step 13828: {'lr': 0.0004921629375998736, 'samples': 2654976, 'steps': 13827, 'loss/train': 1.5501351356506348} +11/06/2021 23:09:26 - INFO - __main__ - Step 13829: {'lr': 0.0004921616192301065, 'samples': 2655168, 'steps': 13828, 'loss/train': 0.7807660102844238} +11/06/2021 23:09:26 - INFO - __main__ - Step 13830: {'lr': 0.0004921603007512253, 'samples': 2655360, 'steps': 13829, 'loss/train': 1.8146405220031738} +11/06/2021 23:09:28 - INFO - __main__ - Step 13831: {'lr': 0.0004921589821632302, 'samples': 2655552, 'steps': 13830, 'loss/train': 1.731347680091858} +11/06/2021 23:09:28 - INFO - __main__ - Step 13832: {'lr': 0.0004921576634661221, 'samples': 2655744, 'steps': 13831, 'loss/train': 1.670548439025879} +11/06/2021 23:09:28 - INFO - __main__ - Step 13833: {'lr': 0.0004921563446599015, 'samples': 2655936, 'steps': 13832, 'loss/train': 1.5320069789886475} +11/06/2021 23:09:29 - INFO - __main__ - Step 13834: {'lr': 0.000492155025744569, 'samples': 2656128, 'steps': 13833, 'loss/train': 1.0628443956375122} +11/06/2021 23:09:29 - INFO - __main__ - Step 13835: {'lr': 0.0004921537067201252, 'samples': 2656320, 'steps': 13834, 'loss/train': 2.1405911445617676} +11/06/2021 23:09:30 - INFO - __main__ - Step 13836: {'lr': 0.0004921523875865706, 'samples': 2656512, 'steps': 13835, 'loss/train': 1.0246696472167969} +11/06/2021 23:09:30 - INFO - __main__ - Step 13837: {'lr': 0.000492151068343906, 'samples': 2656704, 'steps': 13836, 'loss/train': 1.8948359489440918} +11/06/2021 23:09:31 - INFO - __main__ - Step 13838: {'lr': 0.0004921497489921318, 'samples': 2656896, 'steps': 13837, 'loss/train': 1.7364670038223267} +11/06/2021 23:09:31 - INFO - __main__ - Step 13839: {'lr': 0.0004921484295312485, 'samples': 2657088, 'steps': 13838, 'loss/train': 1.4942817687988281} +11/06/2021 23:09:31 - INFO - __main__ - Step 13840: {'lr': 0.0004921471099612571, 'samples': 2657280, 'steps': 13839, 'loss/train': 1.2678571939468384} +11/06/2021 23:09:32 - INFO - __main__ - Step 13841: {'lr': 0.0004921457902821578, 'samples': 2657472, 'steps': 13840, 'loss/train': 1.7979927062988281} +11/06/2021 23:09:33 - INFO - __main__ - Step 13842: {'lr': 0.0004921444704939514, 'samples': 2657664, 'steps': 13841, 'loss/train': 1.2086461782455444} +11/06/2021 23:09:33 - INFO - __main__ - Step 13843: {'lr': 0.0004921431505966384, 'samples': 2657856, 'steps': 13842, 'loss/train': 2.1114842891693115} +11/06/2021 23:09:33 - INFO - __main__ - Step 13844: {'lr': 0.0004921418305902194, 'samples': 2658048, 'steps': 13843, 'loss/train': 1.7268887758255005} +11/06/2021 23:09:34 - INFO - __main__ - Step 13845: {'lr': 0.0004921405104746951, 'samples': 2658240, 'steps': 13844, 'loss/train': 1.4159009456634521} +11/06/2021 23:09:35 - INFO - __main__ - Step 13846: {'lr': 0.0004921391902500661, 'samples': 2658432, 'steps': 13845, 'loss/train': 0.772130012512207} +11/06/2021 23:09:35 - INFO - __main__ - Step 13847: {'lr': 0.0004921378699163328, 'samples': 2658624, 'steps': 13846, 'loss/train': 1.6413114070892334} +11/06/2021 23:09:35 - INFO - __main__ - Step 13848: {'lr': 0.0004921365494734959, 'samples': 2658816, 'steps': 13847, 'loss/train': 2.0871777534484863} +11/06/2021 23:09:36 - INFO - __main__ - Step 13849: {'lr': 0.0004921352289215561, 'samples': 2659008, 'steps': 13848, 'loss/train': 1.6378384828567505} +11/06/2021 23:09:36 - INFO - __main__ - Step 13850: {'lr': 0.0004921339082605137, 'samples': 2659200, 'steps': 13849, 'loss/train': 1.849760890007019} +11/06/2021 23:09:37 - INFO - __main__ - Step 13851: {'lr': 0.0004921325874903697, 'samples': 2659392, 'steps': 13850, 'loss/train': 1.766753077507019} +11/06/2021 23:09:38 - INFO - __main__ - Step 13852: {'lr': 0.0004921312666111245, 'samples': 2659584, 'steps': 13851, 'loss/train': 1.397715449333191} +11/06/2021 23:09:38 - INFO - __main__ - Step 13853: {'lr': 0.0004921299456227785, 'samples': 2659776, 'steps': 13852, 'loss/train': 1.6967663764953613} +11/06/2021 23:09:38 - INFO - __main__ - Step 13854: {'lr': 0.0004921286245253327, 'samples': 2659968, 'steps': 13853, 'loss/train': 1.3301624059677124} +11/06/2021 23:09:39 - INFO - __main__ - Step 13855: {'lr': 0.0004921273033187874, 'samples': 2660160, 'steps': 13854, 'loss/train': 2.2361197471618652} +11/06/2021 23:09:39 - INFO - __main__ - Step 13856: {'lr': 0.0004921259820031431, 'samples': 2660352, 'steps': 13855, 'loss/train': 1.5160555839538574} +11/06/2021 23:09:40 - INFO - __main__ - Step 13857: {'lr': 0.0004921246605784008, 'samples': 2660544, 'steps': 13856, 'loss/train': 1.797963261604309} +11/06/2021 23:09:40 - INFO - __main__ - Step 13858: {'lr': 0.0004921233390445608, 'samples': 2660736, 'steps': 13857, 'loss/train': 1.6788036823272705} +11/06/2021 23:09:41 - INFO - __main__ - Step 13859: {'lr': 0.0004921220174016238, 'samples': 2660928, 'steps': 13858, 'loss/train': 1.196427345275879} +11/06/2021 23:09:41 - INFO - __main__ - Step 13860: {'lr': 0.0004921206956495903, 'samples': 2661120, 'steps': 13859, 'loss/train': 0.5547469854354858} +11/06/2021 23:09:42 - INFO - __main__ - Step 13861: {'lr': 0.000492119373788461, 'samples': 2661312, 'steps': 13860, 'loss/train': 1.9061776399612427} +11/06/2021 23:09:42 - INFO - __main__ - Step 13862: {'lr': 0.0004921180518182363, 'samples': 2661504, 'steps': 13861, 'loss/train': 1.7613266706466675} +11/06/2021 23:09:43 - INFO - __main__ - Step 13863: {'lr': 0.0004921167297389171, 'samples': 2661696, 'steps': 13862, 'loss/train': 1.3482214212417603} +11/06/2021 23:09:43 - INFO - __main__ - Step 13864: {'lr': 0.0004921154075505038, 'samples': 2661888, 'steps': 13863, 'loss/train': 1.8354885578155518} +11/06/2021 23:09:44 - INFO - __main__ - Step 13865: {'lr': 0.0004921140852529969, 'samples': 2662080, 'steps': 13864, 'loss/train': 1.8951635360717773} +11/06/2021 23:09:44 - INFO - __main__ - Step 13866: {'lr': 0.0004921127628463972, 'samples': 2662272, 'steps': 13865, 'loss/train': 1.8773669004440308} +11/06/2021 23:09:44 - INFO - __main__ - Step 13867: {'lr': 0.0004921114403307053, 'samples': 2662464, 'steps': 13866, 'loss/train': 1.8073745965957642} +11/06/2021 23:09:45 - INFO - __main__ - Step 13868: {'lr': 0.0004921101177059218, 'samples': 2662656, 'steps': 13867, 'loss/train': 2.099315881729126} +11/06/2021 23:09:46 - INFO - __main__ - Step 13869: {'lr': 0.0004921087949720471, 'samples': 2662848, 'steps': 13868, 'loss/train': 1.927840232849121} +11/06/2021 23:09:46 - INFO - __main__ - Step 13870: {'lr': 0.0004921074721290819, 'samples': 2663040, 'steps': 13869, 'loss/train': 1.8711230754852295} +11/06/2021 23:09:46 - INFO - __main__ - Step 13871: {'lr': 0.0004921061491770268, 'samples': 2663232, 'steps': 13870, 'loss/train': 1.5287330150604248} +11/06/2021 23:09:47 - INFO - __main__ - Step 13872: {'lr': 0.0004921048261158825, 'samples': 2663424, 'steps': 13871, 'loss/train': 1.6624870300292969} +11/06/2021 23:09:48 - INFO - __main__ - Step 13873: {'lr': 0.0004921035029456493, 'samples': 2663616, 'steps': 13872, 'loss/train': 1.8428698778152466} +11/06/2021 23:09:48 - INFO - __main__ - Step 13874: {'lr': 0.0004921021796663282, 'samples': 2663808, 'steps': 13873, 'loss/train': 1.4383753538131714} +11/06/2021 23:09:49 - INFO - __main__ - Step 13875: {'lr': 0.0004921008562779195, 'samples': 2664000, 'steps': 13874, 'loss/train': 1.4360547065734863} +11/06/2021 23:09:49 - INFO - __main__ - Step 13876: {'lr': 0.0004920995327804239, 'samples': 2664192, 'steps': 13875, 'loss/train': 1.6160893440246582} +11/06/2021 23:09:49 - INFO - __main__ - Step 13877: {'lr': 0.000492098209173842, 'samples': 2664384, 'steps': 13876, 'loss/train': 1.0459492206573486} +11/06/2021 23:09:50 - INFO - __main__ - Step 13878: {'lr': 0.0004920968854581745, 'samples': 2664576, 'steps': 13877, 'loss/train': 1.7214491367340088} +11/06/2021 23:09:51 - INFO - __main__ - Step 13879: {'lr': 0.0004920955616334216, 'samples': 2664768, 'steps': 13878, 'loss/train': 1.4879608154296875} +11/06/2021 23:09:51 - INFO - __main__ - Step 13880: {'lr': 0.0004920942376995844, 'samples': 2664960, 'steps': 13879, 'loss/train': 1.7275727987289429} +11/06/2021 23:09:51 - INFO - __main__ - Step 13881: {'lr': 0.0004920929136566632, 'samples': 2665152, 'steps': 13880, 'loss/train': 1.556997299194336} +11/06/2021 23:09:52 - INFO - __main__ - Step 13882: {'lr': 0.0004920915895046587, 'samples': 2665344, 'steps': 13881, 'loss/train': 1.629291296005249} +11/06/2021 23:09:52 - INFO - __main__ - Step 13883: {'lr': 0.0004920902652435715, 'samples': 2665536, 'steps': 13882, 'loss/train': 2.0257277488708496} +11/06/2021 23:09:53 - INFO - __main__ - Step 13884: {'lr': 0.0004920889408734021, 'samples': 2665728, 'steps': 13883, 'loss/train': 1.8871136903762817} +11/06/2021 23:09:53 - INFO - __main__ - Step 13885: {'lr': 0.0004920876163941511, 'samples': 2665920, 'steps': 13884, 'loss/train': 1.1255569458007812} +11/06/2021 23:09:54 - INFO - __main__ - Step 13886: {'lr': 0.0004920862918058192, 'samples': 2666112, 'steps': 13885, 'loss/train': 1.7489358186721802} +11/06/2021 23:09:54 - INFO - __main__ - Step 13887: {'lr': 0.000492084967108407, 'samples': 2666304, 'steps': 13886, 'loss/train': 2.234173536300659} +11/06/2021 23:09:54 - INFO - __main__ - Step 13888: {'lr': 0.000492083642301915, 'samples': 2666496, 'steps': 13887, 'loss/train': 1.7307212352752686} +11/06/2021 23:09:56 - INFO - __main__ - Step 13889: {'lr': 0.0004920823173863439, 'samples': 2666688, 'steps': 13888, 'loss/train': 1.4370955228805542} +11/06/2021 23:09:56 - INFO - __main__ - Step 13890: {'lr': 0.0004920809923616942, 'samples': 2666880, 'steps': 13889, 'loss/train': 1.8873080015182495} +11/06/2021 23:09:56 - INFO - __main__ - Step 13891: {'lr': 0.0004920796672279666, 'samples': 2667072, 'steps': 13890, 'loss/train': 1.8920522928237915} +11/06/2021 23:09:57 - INFO - __main__ - Step 13892: {'lr': 0.0004920783419851615, 'samples': 2667264, 'steps': 13891, 'loss/train': 5.647333145141602} +11/06/2021 23:09:57 - INFO - __main__ - Step 13893: {'lr': 0.0004920770166332798, 'samples': 2667456, 'steps': 13892, 'loss/train': 1.972109317779541} +11/06/2021 23:09:57 - INFO - __main__ - Step 13894: {'lr': 0.0004920756911723219, 'samples': 2667648, 'steps': 13893, 'loss/train': 2.5524847507476807} +11/06/2021 23:09:59 - INFO - __main__ - Step 13895: {'lr': 0.0004920743656022884, 'samples': 2667840, 'steps': 13894, 'loss/train': 1.815747618675232} +11/06/2021 23:09:59 - INFO - __main__ - Step 13896: {'lr': 0.0004920730399231799, 'samples': 2668032, 'steps': 13895, 'loss/train': 1.4550343751907349} +11/06/2021 23:09:59 - INFO - __main__ - Step 13897: {'lr': 0.000492071714134997, 'samples': 2668224, 'steps': 13896, 'loss/train': 1.4864250421524048} +11/06/2021 23:10:00 - INFO - __main__ - Step 13898: {'lr': 0.0004920703882377403, 'samples': 2668416, 'steps': 13897, 'loss/train': 1.741361141204834} +11/06/2021 23:10:00 - INFO - __main__ - Step 13899: {'lr': 0.0004920690622314105, 'samples': 2668608, 'steps': 13898, 'loss/train': 2.994898796081543} +11/06/2021 23:10:01 - INFO - __main__ - Step 13900: {'lr': 0.0004920677361160081, 'samples': 2668800, 'steps': 13899, 'loss/train': 1.8634357452392578} +11/06/2021 23:10:01 - INFO - __main__ - Step 13901: {'lr': 0.0004920664098915337, 'samples': 2668992, 'steps': 13900, 'loss/train': 1.6608809232711792} +11/06/2021 23:10:02 - INFO - __main__ - Step 13902: {'lr': 0.000492065083557988, 'samples': 2669184, 'steps': 13901, 'loss/train': 1.932618260383606} +11/06/2021 23:10:02 - INFO - __main__ - Step 13903: {'lr': 0.0004920637571153713, 'samples': 2669376, 'steps': 13902, 'loss/train': 1.4454110860824585} +11/06/2021 23:10:02 - INFO - __main__ - Step 13904: {'lr': 0.0004920624305636846, 'samples': 2669568, 'steps': 13903, 'loss/train': 1.8593177795410156} +11/06/2021 23:10:03 - INFO - __main__ - Step 13905: {'lr': 0.0004920611039029283, 'samples': 2669760, 'steps': 13904, 'loss/train': 1.7864686250686646} +11/06/2021 23:10:05 - INFO - __main__ - Step 13906: {'lr': 0.0004920597771331029, 'samples': 2669952, 'steps': 13905, 'loss/train': 2.002392292022705} +11/06/2021 23:10:05 - INFO - __main__ - Step 13907: {'lr': 0.0004920584502542091, 'samples': 2670144, 'steps': 13906, 'loss/train': 0.30893194675445557} +11/06/2021 23:10:06 - INFO - __main__ - Step 13908: {'lr': 0.0004920571232662475, 'samples': 2670336, 'steps': 13907, 'loss/train': 1.9505276679992676} +11/06/2021 23:10:06 - INFO - __main__ - Step 13909: {'lr': 0.0004920557961692188, 'samples': 2670528, 'steps': 13908, 'loss/train': 1.9398505687713623} +11/06/2021 23:10:06 - INFO - __main__ - Step 13910: {'lr': 0.0004920544689631233, 'samples': 2670720, 'steps': 13909, 'loss/train': 2.0230226516723633} +11/06/2021 23:10:07 - INFO - __main__ - Step 13911: {'lr': 0.000492053141647962, 'samples': 2670912, 'steps': 13910, 'loss/train': 1.8889321088790894} +11/06/2021 23:10:07 - INFO - __main__ - Step 13912: {'lr': 0.0004920518142237352, 'samples': 2671104, 'steps': 13911, 'loss/train': 1.33417809009552} +11/06/2021 23:10:07 - INFO - __main__ - Step 13913: {'lr': 0.0004920504866904436, 'samples': 2671296, 'steps': 13912, 'loss/train': 1.29556143283844} +11/06/2021 23:10:09 - INFO - __main__ - Step 13914: {'lr': 0.0004920491590480878, 'samples': 2671488, 'steps': 13913, 'loss/train': 1.9679369926452637} +11/06/2021 23:10:09 - INFO - __main__ - Step 13915: {'lr': 0.0004920478312966683, 'samples': 2671680, 'steps': 13914, 'loss/train': 1.3328757286071777} +11/06/2021 23:10:09 - INFO - __main__ - Step 13916: {'lr': 0.0004920465034361859, 'samples': 2671872, 'steps': 13915, 'loss/train': 1.5501303672790527} +11/06/2021 23:10:10 - INFO - __main__ - Step 13917: {'lr': 0.000492045175466641, 'samples': 2672064, 'steps': 13916, 'loss/train': 1.871131181716919} +11/06/2021 23:10:10 - INFO - __main__ - Step 13918: {'lr': 0.0004920438473880344, 'samples': 2672256, 'steps': 13917, 'loss/train': 2.702326536178589} +11/06/2021 23:10:11 - INFO - __main__ - Step 13919: {'lr': 0.0004920425192003663, 'samples': 2672448, 'steps': 13918, 'loss/train': 1.7303717136383057} +11/06/2021 23:10:11 - INFO - __main__ - Step 13920: {'lr': 0.0004920411909036379, 'samples': 2672640, 'steps': 13919, 'loss/train': 1.9704726934432983} +11/06/2021 23:10:12 - INFO - __main__ - Step 13921: {'lr': 0.0004920398624978493, 'samples': 2672832, 'steps': 13920, 'loss/train': 1.4717364311218262} +11/06/2021 23:10:12 - INFO - __main__ - Step 13922: {'lr': 0.0004920385339830012, 'samples': 2673024, 'steps': 13921, 'loss/train': 1.7774920463562012} +11/06/2021 23:10:12 - INFO - __main__ - Step 13923: {'lr': 0.0004920372053590945, 'samples': 2673216, 'steps': 13922, 'loss/train': 1.853239893913269} +11/06/2021 23:10:13 - INFO - __main__ - Step 13924: {'lr': 0.0004920358766261294, 'samples': 2673408, 'steps': 13923, 'loss/train': 1.9390660524368286} +11/06/2021 23:10:14 - INFO - __main__ - Step 13925: {'lr': 0.0004920345477841067, 'samples': 2673600, 'steps': 13924, 'loss/train': 2.0693888664245605} +11/06/2021 23:10:14 - INFO - __main__ - Step 13926: {'lr': 0.000492033218833027, 'samples': 2673792, 'steps': 13925, 'loss/train': 1.8519387245178223} +11/06/2021 23:10:14 - INFO - __main__ - Step 13927: {'lr': 0.0004920318897728909, 'samples': 2673984, 'steps': 13926, 'loss/train': 1.803276538848877} +11/06/2021 23:10:15 - INFO - __main__ - Step 13928: {'lr': 0.0004920305606036988, 'samples': 2674176, 'steps': 13927, 'loss/train': 1.768867015838623} +11/06/2021 23:10:16 - INFO - __main__ - Step 13929: {'lr': 0.0004920292313254516, 'samples': 2674368, 'steps': 13928, 'loss/train': 2.1696088314056396} +11/06/2021 23:10:16 - INFO - __main__ - Step 13930: {'lr': 0.0004920279019381497, 'samples': 2674560, 'steps': 13929, 'loss/train': 2.3505563735961914} +11/06/2021 23:10:16 - INFO - __main__ - Step 13931: {'lr': 0.0004920265724417938, 'samples': 2674752, 'steps': 13930, 'loss/train': 0.4778132736682892} +11/06/2021 23:10:17 - INFO - __main__ - Step 13932: {'lr': 0.0004920252428363845, 'samples': 2674944, 'steps': 13931, 'loss/train': 1.7751408815383911} +11/06/2021 23:10:17 - INFO - __main__ - Step 13933: {'lr': 0.0004920239131219223, 'samples': 2675136, 'steps': 13932, 'loss/train': 0.7648064494132996} +11/06/2021 23:10:18 - INFO - __main__ - Step 13934: {'lr': 0.0004920225832984079, 'samples': 2675328, 'steps': 13933, 'loss/train': 1.5931404829025269} +11/06/2021 23:10:18 - INFO - __main__ - Step 13935: {'lr': 0.0004920212533658419, 'samples': 2675520, 'steps': 13934, 'loss/train': 2.218579053878784} +11/06/2021 23:10:19 - INFO - __main__ - Step 13936: {'lr': 0.0004920199233242247, 'samples': 2675712, 'steps': 13935, 'loss/train': 1.7814935445785522} +11/06/2021 23:10:19 - INFO - __main__ - Step 13937: {'lr': 0.0004920185931735572, 'samples': 2675904, 'steps': 13936, 'loss/train': 1.8334205150604248} +11/06/2021 23:10:20 - INFO - __main__ - Step 13938: {'lr': 0.0004920172629138399, 'samples': 2676096, 'steps': 13937, 'loss/train': 1.7788243293762207} +11/06/2021 23:10:20 - INFO - __main__ - Step 13939: {'lr': 0.0004920159325450731, 'samples': 2676288, 'steps': 13938, 'loss/train': 1.6450157165527344} +11/06/2021 23:10:21 - INFO - __main__ - Step 13940: {'lr': 0.0004920146020672578, 'samples': 2676480, 'steps': 13939, 'loss/train': 1.6414921283721924} +11/06/2021 23:10:21 - INFO - __main__ - Step 13941: {'lr': 0.0004920132714803946, 'samples': 2676672, 'steps': 13940, 'loss/train': 1.8297538757324219} +11/06/2021 23:10:22 - INFO - __main__ - Step 13942: {'lr': 0.0004920119407844838, 'samples': 2676864, 'steps': 13941, 'loss/train': 1.148298978805542} +11/06/2021 23:10:22 - INFO - __main__ - Step 13943: {'lr': 0.0004920106099795262, 'samples': 2677056, 'steps': 13942, 'loss/train': 2.2544357776641846} +11/06/2021 23:10:22 - INFO - __main__ - Step 13944: {'lr': 0.0004920092790655224, 'samples': 2677248, 'steps': 13943, 'loss/train': 2.0402214527130127} +11/06/2021 23:10:24 - INFO - __main__ - Step 13945: {'lr': 0.0004920079480424728, 'samples': 2677440, 'steps': 13944, 'loss/train': 1.6051249504089355} +11/06/2021 23:10:24 - INFO - __main__ - Step 13946: {'lr': 0.0004920066169103783, 'samples': 2677632, 'steps': 13945, 'loss/train': 1.0051872730255127} +11/06/2021 23:10:24 - INFO - __main__ - Step 13947: {'lr': 0.0004920052856692394, 'samples': 2677824, 'steps': 13946, 'loss/train': 1.7988791465759277} +11/06/2021 23:10:25 - INFO - __main__ - Step 13948: {'lr': 0.0004920039543190565, 'samples': 2678016, 'steps': 13947, 'loss/train': 1.3910020589828491} +11/06/2021 23:10:25 - INFO - __main__ - Step 13949: {'lr': 0.0004920026228598303, 'samples': 2678208, 'steps': 13948, 'loss/train': 1.5859302282333374} +11/06/2021 23:10:26 - INFO - __main__ - Step 13950: {'lr': 0.0004920012912915616, 'samples': 2678400, 'steps': 13949, 'loss/train': 1.9164284467697144} +11/06/2021 23:10:26 - INFO - __main__ - Step 13951: {'lr': 0.0004919999596142508, 'samples': 2678592, 'steps': 13950, 'loss/train': 1.7975435256958008} +11/06/2021 23:10:27 - INFO - __main__ - Step 13952: {'lr': 0.0004919986278278986, 'samples': 2678784, 'steps': 13951, 'loss/train': 1.8759640455245972} +11/06/2021 23:10:27 - INFO - __main__ - Step 13953: {'lr': 0.0004919972959325055, 'samples': 2678976, 'steps': 13952, 'loss/train': 2.344235420227051} +11/06/2021 23:10:27 - INFO - __main__ - Step 13954: {'lr': 0.0004919959639280722, 'samples': 2679168, 'steps': 13953, 'loss/train': 3.453373432159424} +11/06/2021 23:10:28 - INFO - __main__ - Step 13955: {'lr': 0.0004919946318145992, 'samples': 2679360, 'steps': 13954, 'loss/train': 2.145124673843384} +11/06/2021 23:10:29 - INFO - __main__ - Step 13956: {'lr': 0.0004919932995920872, 'samples': 2679552, 'steps': 13955, 'loss/train': 1.7001293897628784} +11/06/2021 23:10:29 - INFO - __main__ - Step 13957: {'lr': 0.0004919919672605366, 'samples': 2679744, 'steps': 13956, 'loss/train': 1.792694330215454} +11/06/2021 23:10:29 - INFO - __main__ - Step 13958: {'lr': 0.0004919906348199483, 'samples': 2679936, 'steps': 13957, 'loss/train': 1.8448896408081055} +11/06/2021 23:10:30 - INFO - __main__ - Step 13959: {'lr': 0.0004919893022703228, 'samples': 2680128, 'steps': 13958, 'loss/train': 1.7649340629577637} +11/06/2021 23:10:31 - INFO - __main__ - Step 13960: {'lr': 0.0004919879696116605, 'samples': 2680320, 'steps': 13959, 'loss/train': 1.3440182209014893} +11/06/2021 23:10:31 - INFO - __main__ - Step 13961: {'lr': 0.0004919866368439624, 'samples': 2680512, 'steps': 13960, 'loss/train': 2.0946123600006104} +11/06/2021 23:10:31 - INFO - __main__ - Step 13962: {'lr': 0.0004919853039672287, 'samples': 2680704, 'steps': 13961, 'loss/train': 1.806232213973999} +11/06/2021 23:10:32 - INFO - __main__ - Step 13963: {'lr': 0.00049198397098146, 'samples': 2680896, 'steps': 13962, 'loss/train': 2.475085496902466} +11/06/2021 23:10:32 - INFO - __main__ - Step 13964: {'lr': 0.0004919826378866573, 'samples': 2681088, 'steps': 13963, 'loss/train': 1.6275722980499268} +11/06/2021 23:10:33 - INFO - __main__ - Step 13965: {'lr': 0.0004919813046828209, 'samples': 2681280, 'steps': 13964, 'loss/train': 1.4893933534622192} +11/06/2021 23:10:34 - INFO - __main__ - Step 13966: {'lr': 0.0004919799713699514, 'samples': 2681472, 'steps': 13965, 'loss/train': 1.8989421129226685} +11/06/2021 23:10:34 - INFO - __main__ - Step 13967: {'lr': 0.0004919786379480494, 'samples': 2681664, 'steps': 13966, 'loss/train': 2.0461950302124023} +11/06/2021 23:10:34 - INFO - __main__ - Step 13968: {'lr': 0.0004919773044171158, 'samples': 2681856, 'steps': 13967, 'loss/train': 1.7117947340011597} +11/06/2021 23:10:35 - INFO - __main__ - Step 13969: {'lr': 0.0004919759707771507, 'samples': 2682048, 'steps': 13968, 'loss/train': 1.7647126913070679} +11/06/2021 23:10:35 - INFO - __main__ - Step 13970: {'lr': 0.0004919746370281551, 'samples': 2682240, 'steps': 13969, 'loss/train': 1.784766435623169} +11/06/2021 23:10:36 - INFO - __main__ - Step 13971: {'lr': 0.0004919733031701295, 'samples': 2682432, 'steps': 13970, 'loss/train': 1.7901809215545654} +11/06/2021 23:10:37 - INFO - __main__ - Step 13972: {'lr': 0.0004919719692030743, 'samples': 2682624, 'steps': 13971, 'loss/train': 1.4720513820648193} +11/06/2021 23:10:37 - INFO - __main__ - Step 13973: {'lr': 0.0004919706351269904, 'samples': 2682816, 'steps': 13972, 'loss/train': 1.9798334836959839} +11/06/2021 23:10:37 - INFO - __main__ - Step 13974: {'lr': 0.0004919693009418782, 'samples': 2683008, 'steps': 13973, 'loss/train': 2.224214553833008} +11/06/2021 23:10:38 - INFO - __main__ - Step 13975: {'lr': 0.0004919679666477384, 'samples': 2683200, 'steps': 13974, 'loss/train': 1.7048498392105103} +11/06/2021 23:10:39 - INFO - __main__ - Step 13976: {'lr': 0.0004919666322445715, 'samples': 2683392, 'steps': 13975, 'loss/train': 1.784834384918213} +11/06/2021 23:10:39 - INFO - __main__ - Step 13977: {'lr': 0.0004919652977323783, 'samples': 2683584, 'steps': 13976, 'loss/train': 1.4972141981124878} +11/06/2021 23:10:39 - INFO - __main__ - Step 13978: {'lr': 0.0004919639631111592, 'samples': 2683776, 'steps': 13977, 'loss/train': 1.7331345081329346} +11/06/2021 23:10:40 - INFO - __main__ - Step 13979: {'lr': 0.0004919626283809149, 'samples': 2683968, 'steps': 13978, 'loss/train': 1.7867261171340942} +11/06/2021 23:10:40 - INFO - __main__ - Step 13980: {'lr': 0.0004919612935416459, 'samples': 2684160, 'steps': 13979, 'loss/train': 1.5536366701126099} +11/06/2021 23:10:41 - INFO - __main__ - Step 13981: {'lr': 0.000491959958593353, 'samples': 2684352, 'steps': 13980, 'loss/train': 1.6696289777755737} +11/06/2021 23:10:41 - INFO - __main__ - Step 13982: {'lr': 0.0004919586235360365, 'samples': 2684544, 'steps': 13981, 'loss/train': 1.6226602792739868} +11/06/2021 23:10:42 - INFO - __main__ - Step 13983: {'lr': 0.0004919572883696974, 'samples': 2684736, 'steps': 13982, 'loss/train': 1.9969899654388428} +11/06/2021 23:10:42 - INFO - __main__ - Step 13984: {'lr': 0.0004919559530943359, 'samples': 2684928, 'steps': 13983, 'loss/train': 1.8502788543701172} +11/06/2021 23:10:43 - INFO - __main__ - Step 13985: {'lr': 0.0004919546177099528, 'samples': 2685120, 'steps': 13984, 'loss/train': 2.2144908905029297} +11/06/2021 23:10:44 - INFO - __main__ - Step 13986: {'lr': 0.0004919532822165487, 'samples': 2685312, 'steps': 13985, 'loss/train': 1.7305831909179688} +11/06/2021 23:10:44 - INFO - __main__ - Step 13987: {'lr': 0.0004919519466141242, 'samples': 2685504, 'steps': 13986, 'loss/train': 2.206554889678955} +11/06/2021 23:10:44 - INFO - __main__ - Step 13988: {'lr': 0.0004919506109026799, 'samples': 2685696, 'steps': 13987, 'loss/train': 2.002794027328491} +11/06/2021 23:10:45 - INFO - __main__ - Step 13989: {'lr': 0.0004919492750822163, 'samples': 2685888, 'steps': 13988, 'loss/train': 1.8074073791503906} +11/06/2021 23:10:45 - INFO - __main__ - Step 13990: {'lr': 0.0004919479391527343, 'samples': 2686080, 'steps': 13989, 'loss/train': 1.7749497890472412} +11/06/2021 23:10:45 - INFO - __main__ - Step 13991: {'lr': 0.0004919466031142342, 'samples': 2686272, 'steps': 13990, 'loss/train': 1.2076705694198608} +11/06/2021 23:10:46 - INFO - __main__ - Step 13992: {'lr': 0.0004919452669667166, 'samples': 2686464, 'steps': 13991, 'loss/train': 3.3132309913635254} +11/06/2021 23:10:47 - INFO - __main__ - Step 13993: {'lr': 0.0004919439307101822, 'samples': 2686656, 'steps': 13992, 'loss/train': 3.050110101699829} +11/06/2021 23:10:47 - INFO - __main__ - Step 13994: {'lr': 0.0004919425943446317, 'samples': 2686848, 'steps': 13993, 'loss/train': 1.7559268474578857} +11/06/2021 23:10:48 - INFO - __main__ - Step 13995: {'lr': 0.0004919412578700654, 'samples': 2687040, 'steps': 13994, 'loss/train': 1.2231806516647339} +11/06/2021 23:10:48 - INFO - __main__ - Step 13996: {'lr': 0.0004919399212864843, 'samples': 2687232, 'steps': 13995, 'loss/train': 1.859178066253662} +11/06/2021 23:10:48 - INFO - __main__ - Step 13997: {'lr': 0.0004919385845938888, 'samples': 2687424, 'steps': 13996, 'loss/train': 1.9321575164794922} +11/06/2021 23:10:49 - INFO - __main__ - Step 13998: {'lr': 0.0004919372477922794, 'samples': 2687616, 'steps': 13997, 'loss/train': 1.7246944904327393} +11/06/2021 23:10:50 - INFO - __main__ - Step 13999: {'lr': 0.0004919359108816569, 'samples': 2687808, 'steps': 13998, 'loss/train': 2.0384068489074707} +11/06/2021 23:10:50 - INFO - __main__ - Step 14000: {'lr': 0.0004919345738620218, 'samples': 2688000, 'steps': 13999, 'loss/train': 1.2765216827392578} +11/06/2021 23:10:50 - INFO - __main__ - Step 14001: {'lr': 0.0004919332367333747, 'samples': 2688192, 'steps': 14000, 'loss/train': 1.9448779821395874} +11/06/2021 23:10:51 - INFO - __main__ - Step 14002: {'lr': 0.0004919318994957162, 'samples': 2688384, 'steps': 14001, 'loss/train': 1.9251288175582886} +11/06/2021 23:10:52 - INFO - __main__ - Step 14003: {'lr': 0.0004919305621490469, 'samples': 2688576, 'steps': 14002, 'loss/train': 2.482295274734497} +11/06/2021 23:10:52 - INFO - __main__ - Step 14004: {'lr': 0.0004919292246933675, 'samples': 2688768, 'steps': 14003, 'loss/train': 1.9574697017669678} +11/06/2021 23:10:52 - INFO - __main__ - Step 14005: {'lr': 0.0004919278871286785, 'samples': 2688960, 'steps': 14004, 'loss/train': 1.896154761314392} +11/06/2021 23:10:53 - INFO - __main__ - Step 14006: {'lr': 0.0004919265494549805, 'samples': 2689152, 'steps': 14005, 'loss/train': 1.633683681488037} +11/06/2021 23:10:53 - INFO - __main__ - Step 14007: {'lr': 0.0004919252116722742, 'samples': 2689344, 'steps': 14006, 'loss/train': 1.4971553087234497} +11/06/2021 23:10:54 - INFO - __main__ - Step 14008: {'lr': 0.0004919238737805601, 'samples': 2689536, 'steps': 14007, 'loss/train': 1.8007830381393433} +11/06/2021 23:10:55 - INFO - __main__ - Step 14009: {'lr': 0.0004919225357798387, 'samples': 2689728, 'steps': 14008, 'loss/train': 1.9640558958053589} +11/06/2021 23:10:55 - INFO - __main__ - Step 14010: {'lr': 0.000491921197670111, 'samples': 2689920, 'steps': 14009, 'loss/train': 1.3045183420181274} +11/06/2021 23:10:55 - INFO - __main__ - Step 14011: {'lr': 0.0004919198594513771, 'samples': 2690112, 'steps': 14010, 'loss/train': 1.3401371240615845} +11/06/2021 23:10:56 - INFO - __main__ - Step 14012: {'lr': 0.0004919185211236379, 'samples': 2690304, 'steps': 14011, 'loss/train': 1.836495280265808} +11/06/2021 23:10:57 - INFO - __main__ - Step 14013: {'lr': 0.000491917182686894, 'samples': 2690496, 'steps': 14012, 'loss/train': 1.7330890893936157} +11/06/2021 23:10:57 - INFO - __main__ - Step 14014: {'lr': 0.0004919158441411459, 'samples': 2690688, 'steps': 14013, 'loss/train': 1.8115290403366089} +11/06/2021 23:10:57 - INFO - __main__ - Step 14015: {'lr': 0.0004919145054863943, 'samples': 2690880, 'steps': 14014, 'loss/train': 1.6873303651809692} +11/06/2021 23:10:58 - INFO - __main__ - Step 14016: {'lr': 0.0004919131667226398, 'samples': 2691072, 'steps': 14015, 'loss/train': 1.5199148654937744} +11/06/2021 23:10:58 - INFO - __main__ - Step 14017: {'lr': 0.0004919118278498828, 'samples': 2691264, 'steps': 14016, 'loss/train': 1.7640634775161743} +11/06/2021 23:10:58 - INFO - __main__ - Step 14018: {'lr': 0.0004919104888681242, 'samples': 2691456, 'steps': 14017, 'loss/train': 2.0215377807617188} +11/06/2021 23:10:59 - INFO - __main__ - Step 14019: {'lr': 0.0004919091497773643, 'samples': 2691648, 'steps': 14018, 'loss/train': 1.64264976978302} +11/06/2021 23:11:00 - INFO - __main__ - Step 14020: {'lr': 0.0004919078105776041, 'samples': 2691840, 'steps': 14019, 'loss/train': 1.904662013053894} +11/06/2021 23:11:00 - INFO - __main__ - Step 14021: {'lr': 0.0004919064712688439, 'samples': 2692032, 'steps': 14020, 'loss/train': 1.8053239583969116} +11/06/2021 23:11:00 - INFO - __main__ - Step 14022: {'lr': 0.0004919051318510844, 'samples': 2692224, 'steps': 14021, 'loss/train': 2.048910617828369} +11/06/2021 23:11:01 - INFO - __main__ - Step 14023: {'lr': 0.0004919037923243261, 'samples': 2692416, 'steps': 14022, 'loss/train': 1.2819080352783203} +11/06/2021 23:11:02 - INFO - __main__ - Step 14024: {'lr': 0.0004919024526885697, 'samples': 2692608, 'steps': 14023, 'loss/train': 1.1374632120132446} +11/06/2021 23:11:02 - INFO - __main__ - Step 14025: {'lr': 0.0004919011129438158, 'samples': 2692800, 'steps': 14024, 'loss/train': 1.4526000022888184} +11/06/2021 23:11:03 - INFO - __main__ - Step 14026: {'lr': 0.0004918997730900649, 'samples': 2692992, 'steps': 14025, 'loss/train': 1.2924232482910156} +11/06/2021 23:11:03 - INFO - __main__ - Step 14027: {'lr': 0.0004918984331273178, 'samples': 2693184, 'steps': 14026, 'loss/train': 2.08219313621521} +11/06/2021 23:11:03 - INFO - __main__ - Step 14028: {'lr': 0.0004918970930555751, 'samples': 2693376, 'steps': 14027, 'loss/train': 1.7137112617492676} +11/06/2021 23:11:04 - INFO - __main__ - Step 14029: {'lr': 0.0004918957528748371, 'samples': 2693568, 'steps': 14028, 'loss/train': 1.5124090909957886} +11/06/2021 23:11:05 - INFO - __main__ - Step 14030: {'lr': 0.0004918944125851047, 'samples': 2693760, 'steps': 14029, 'loss/train': 1.7956403493881226} +11/06/2021 23:11:05 - INFO - __main__ - Step 14031: {'lr': 0.0004918930721863784, 'samples': 2693952, 'steps': 14030, 'loss/train': 0.82200026512146} +11/06/2021 23:11:05 - INFO - __main__ - Step 14032: {'lr': 0.0004918917316786589, 'samples': 2694144, 'steps': 14031, 'loss/train': 1.9360613822937012} +11/06/2021 23:11:06 - INFO - __main__ - Step 14033: {'lr': 0.0004918903910619465, 'samples': 2694336, 'steps': 14032, 'loss/train': 1.157104253768921} +11/06/2021 23:11:07 - INFO - __main__ - Step 14034: {'lr': 0.0004918890503362422, 'samples': 2694528, 'steps': 14033, 'loss/train': 1.9156838655471802} +11/06/2021 23:11:07 - INFO - __main__ - Step 14035: {'lr': 0.0004918877095015465, 'samples': 2694720, 'steps': 14034, 'loss/train': 2.019812822341919} +11/06/2021 23:11:07 - INFO - __main__ - Step 14036: {'lr': 0.0004918863685578598, 'samples': 2694912, 'steps': 14035, 'loss/train': 1.6677758693695068} +11/06/2021 23:11:08 - INFO - __main__ - Step 14037: {'lr': 0.0004918850275051829, 'samples': 2695104, 'steps': 14036, 'loss/train': 2.457850217819214} +11/06/2021 23:11:08 - INFO - __main__ - Step 14038: {'lr': 0.0004918836863435162, 'samples': 2695296, 'steps': 14037, 'loss/train': 2.003868341445923} +11/06/2021 23:11:09 - INFO - __main__ - Step 14039: {'lr': 0.0004918823450728606, 'samples': 2695488, 'steps': 14038, 'loss/train': 1.5999841690063477} +11/06/2021 23:11:10 - INFO - __main__ - Step 14040: {'lr': 0.0004918810036932164, 'samples': 2695680, 'steps': 14039, 'loss/train': 1.710452675819397} +11/06/2021 23:11:10 - INFO - __main__ - Step 14041: {'lr': 0.0004918796622045844, 'samples': 2695872, 'steps': 14040, 'loss/train': 1.9019668102264404} +11/06/2021 23:11:10 - INFO - __main__ - Step 14042: {'lr': 0.0004918783206069652, 'samples': 2696064, 'steps': 14041, 'loss/train': 1.7770543098449707} +11/06/2021 23:11:11 - INFO - __main__ - Step 14043: {'lr': 0.0004918769789003593, 'samples': 2696256, 'steps': 14042, 'loss/train': 1.4025808572769165} +11/06/2021 23:11:11 - INFO - __main__ - Step 14044: {'lr': 0.0004918756370847674, 'samples': 2696448, 'steps': 14043, 'loss/train': 1.5960426330566406} +11/06/2021 23:11:12 - INFO - __main__ - Step 14045: {'lr': 0.0004918742951601902, 'samples': 2696640, 'steps': 14044, 'loss/train': 1.9002901315689087} +11/06/2021 23:11:12 - INFO - __main__ - Step 14046: {'lr': 0.000491872953126628, 'samples': 2696832, 'steps': 14045, 'loss/train': 1.677998661994934} +11/06/2021 23:11:13 - INFO - __main__ - Step 14047: {'lr': 0.0004918716109840817, 'samples': 2697024, 'steps': 14046, 'loss/train': 1.461251139640808} +11/06/2021 23:11:13 - INFO - __main__ - Step 14048: {'lr': 0.0004918702687325517, 'samples': 2697216, 'steps': 14047, 'loss/train': 1.8989447355270386} +11/06/2021 23:11:13 - INFO - __main__ - Step 14049: {'lr': 0.0004918689263720388, 'samples': 2697408, 'steps': 14048, 'loss/train': 1.1831153631210327} +11/06/2021 23:11:14 - INFO - __main__ - Step 14050: {'lr': 0.0004918675839025434, 'samples': 2697600, 'steps': 14049, 'loss/train': 1.7708138227462769} +11/06/2021 23:11:15 - INFO - __main__ - Step 14051: {'lr': 0.0004918662413240662, 'samples': 2697792, 'steps': 14050, 'loss/train': 1.32278311252594} +11/06/2021 23:11:15 - INFO - __main__ - Step 14052: {'lr': 0.0004918648986366078, 'samples': 2697984, 'steps': 14051, 'loss/train': 1.6384484767913818} +11/06/2021 23:11:15 - INFO - __main__ - Step 14053: {'lr': 0.0004918635558401687, 'samples': 2698176, 'steps': 14052, 'loss/train': 2.0729172229766846} +11/06/2021 23:11:16 - INFO - __main__ - Step 14054: {'lr': 0.0004918622129347498, 'samples': 2698368, 'steps': 14053, 'loss/train': 1.6105602979660034} +11/06/2021 23:11:17 - INFO - __main__ - Step 14055: {'lr': 0.0004918608699203515, 'samples': 2698560, 'steps': 14054, 'loss/train': 2.5296216011047363} +11/06/2021 23:11:17 - INFO - __main__ - Step 14056: {'lr': 0.0004918595267969744, 'samples': 2698752, 'steps': 14055, 'loss/train': 1.7558401823043823} +11/06/2021 23:11:18 - INFO - __main__ - Step 14057: {'lr': 0.0004918581835646191, 'samples': 2698944, 'steps': 14056, 'loss/train': 5.832611083984375} +11/06/2021 23:11:18 - INFO - __main__ - Step 14058: {'lr': 0.0004918568402232863, 'samples': 2699136, 'steps': 14057, 'loss/train': 1.5368565320968628} +11/06/2021 23:11:18 - INFO - __main__ - Step 14059: {'lr': 0.0004918554967729764, 'samples': 2699328, 'steps': 14058, 'loss/train': 2.169316291809082} +11/06/2021 23:11:19 - INFO - __main__ - Step 14060: {'lr': 0.0004918541532136902, 'samples': 2699520, 'steps': 14059, 'loss/train': 2.3635847568511963} +11/06/2021 23:11:20 - INFO - __main__ - Step 14061: {'lr': 0.0004918528095454283, 'samples': 2699712, 'steps': 14060, 'loss/train': 1.7770613431930542} +11/06/2021 23:11:20 - INFO - __main__ - Step 14062: {'lr': 0.0004918514657681913, 'samples': 2699904, 'steps': 14061, 'loss/train': 1.688179850578308} +11/06/2021 23:11:20 - INFO - __main__ - Step 14063: {'lr': 0.0004918501218819796, 'samples': 2700096, 'steps': 14062, 'loss/train': 1.860587239265442} +11/06/2021 23:11:21 - INFO - __main__ - Step 14064: {'lr': 0.0004918487778867941, 'samples': 2700288, 'steps': 14063, 'loss/train': 1.8392343521118164} +11/06/2021 23:11:21 - INFO - __main__ - Step 14065: {'lr': 0.0004918474337826353, 'samples': 2700480, 'steps': 14064, 'loss/train': 1.5922415256500244} +11/06/2021 23:11:22 - INFO - __main__ - Step 14066: {'lr': 0.0004918460895695037, 'samples': 2700672, 'steps': 14065, 'loss/train': 1.585329294204712} +11/06/2021 23:11:23 - INFO - __main__ - Step 14067: {'lr': 0.0004918447452474, 'samples': 2700864, 'steps': 14066, 'loss/train': 3.7865922451019287} +11/06/2021 23:11:23 - INFO - __main__ - Step 14068: {'lr': 0.0004918434008163247, 'samples': 2701056, 'steps': 14067, 'loss/train': 1.2407586574554443} +11/06/2021 23:11:23 - INFO - __main__ - Step 14069: {'lr': 0.0004918420562762786, 'samples': 2701248, 'steps': 14068, 'loss/train': 1.7555322647094727} +11/06/2021 23:11:24 - INFO - __main__ - Step 14070: {'lr': 0.0004918407116272622, 'samples': 2701440, 'steps': 14069, 'loss/train': 1.0781822204589844} +11/06/2021 23:11:24 - INFO - __main__ - Step 14071: {'lr': 0.000491839366869276, 'samples': 2701632, 'steps': 14070, 'loss/train': 2.1765549182891846} +11/06/2021 23:11:25 - INFO - __main__ - Step 14072: {'lr': 0.000491838022002321, 'samples': 2701824, 'steps': 14071, 'loss/train': 1.3922725915908813} +11/06/2021 23:11:25 - INFO - __main__ - Step 14073: {'lr': 0.0004918366770263972, 'samples': 2702016, 'steps': 14072, 'loss/train': 1.583871603012085} +11/06/2021 23:11:26 - INFO - __main__ - Step 14074: {'lr': 0.0004918353319415057, 'samples': 2702208, 'steps': 14073, 'loss/train': 1.4345612525939941} +11/06/2021 23:11:26 - INFO - __main__ - Step 14075: {'lr': 0.0004918339867476469, 'samples': 2702400, 'steps': 14074, 'loss/train': 1.5994923114776611} +11/06/2021 23:11:26 - INFO - __main__ - Step 14076: {'lr': 0.0004918326414448214, 'samples': 2702592, 'steps': 14075, 'loss/train': 2.2489395141601562} +11/06/2021 23:11:28 - INFO - __main__ - Step 14077: {'lr': 0.0004918312960330299, 'samples': 2702784, 'steps': 14076, 'loss/train': 1.737290382385254} +11/06/2021 23:11:28 - INFO - __main__ - Step 14078: {'lr': 0.0004918299505122729, 'samples': 2702976, 'steps': 14077, 'loss/train': 1.7684190273284912} +11/06/2021 23:11:28 - INFO - __main__ - Step 14079: {'lr': 0.000491828604882551, 'samples': 2703168, 'steps': 14078, 'loss/train': 1.933387279510498} +11/06/2021 23:11:29 - INFO - __main__ - Step 14080: {'lr': 0.0004918272591438649, 'samples': 2703360, 'steps': 14079, 'loss/train': 2.6290011405944824} +11/06/2021 23:11:29 - INFO - __main__ - Step 14081: {'lr': 0.0004918259132962153, 'samples': 2703552, 'steps': 14080, 'loss/train': 1.1858018636703491} +11/06/2021 23:11:29 - INFO - __main__ - Step 14082: {'lr': 0.0004918245673396025, 'samples': 2703744, 'steps': 14081, 'loss/train': 1.8530510663986206} +11/06/2021 23:11:31 - INFO - __main__ - Step 14083: {'lr': 0.0004918232212740274, 'samples': 2703936, 'steps': 14082, 'loss/train': 0.8487131595611572} +11/06/2021 23:11:31 - INFO - __main__ - Step 14084: {'lr': 0.0004918218750994904, 'samples': 2704128, 'steps': 14083, 'loss/train': 2.605128288269043} +11/06/2021 23:11:32 - INFO - __main__ - Step 14085: {'lr': 0.0004918205288159923, 'samples': 2704320, 'steps': 14084, 'loss/train': 1.6674420833587646} +11/06/2021 23:11:32 - INFO - __main__ - Step 14086: {'lr': 0.0004918191824235335, 'samples': 2704512, 'steps': 14085, 'loss/train': 1.54026198387146} +11/06/2021 23:11:32 - INFO - __main__ - Step 14087: {'lr': 0.0004918178359221147, 'samples': 2704704, 'steps': 14086, 'loss/train': 2.31728196144104} +11/06/2021 23:11:33 - INFO - __main__ - Step 14088: {'lr': 0.0004918164893117366, 'samples': 2704896, 'steps': 14087, 'loss/train': 1.713340401649475} +11/06/2021 23:11:34 - INFO - __main__ - Step 14089: {'lr': 0.0004918151425923996, 'samples': 2705088, 'steps': 14088, 'loss/train': 1.4485218524932861} +11/06/2021 23:11:34 - INFO - __main__ - Step 14090: {'lr': 0.0004918137957641046, 'samples': 2705280, 'steps': 14089, 'loss/train': 1.635068416595459} +11/06/2021 23:11:34 - INFO - __main__ - Step 14091: {'lr': 0.000491812448826852, 'samples': 2705472, 'steps': 14090, 'loss/train': 1.8842805624008179} +11/06/2021 23:11:35 - INFO - __main__ - Step 14092: {'lr': 0.0004918111017806424, 'samples': 2705664, 'steps': 14091, 'loss/train': 1.5843989849090576} +11/06/2021 23:11:35 - INFO - __main__ - Step 14093: {'lr': 0.0004918097546254764, 'samples': 2705856, 'steps': 14092, 'loss/train': 1.812479019165039} +11/06/2021 23:11:36 - INFO - __main__ - Step 14094: {'lr': 0.0004918084073613547, 'samples': 2706048, 'steps': 14093, 'loss/train': 1.6815907955169678} +11/06/2021 23:11:36 - INFO - __main__ - Step 14095: {'lr': 0.0004918070599882778, 'samples': 2706240, 'steps': 14094, 'loss/train': 1.7472896575927734} +11/06/2021 23:11:37 - INFO - __main__ - Step 14096: {'lr': 0.0004918057125062465, 'samples': 2706432, 'steps': 14095, 'loss/train': 1.8674776554107666} +11/06/2021 23:11:37 - INFO - __main__ - Step 14097: {'lr': 0.0004918043649152612, 'samples': 2706624, 'steps': 14096, 'loss/train': 1.9627310037612915} +11/06/2021 23:11:37 - INFO - __main__ - Step 14098: {'lr': 0.0004918030172153225, 'samples': 2706816, 'steps': 14097, 'loss/train': 1.6795316934585571} +11/06/2021 23:11:38 - INFO - __main__ - Step 14099: {'lr': 0.0004918016694064313, 'samples': 2707008, 'steps': 14098, 'loss/train': 1.9474259614944458} +11/06/2021 23:11:39 - INFO - __main__ - Step 14100: {'lr': 0.0004918003214885877, 'samples': 2707200, 'steps': 14099, 'loss/train': 1.1974012851715088} +11/06/2021 23:11:39 - INFO - __main__ - Step 14101: {'lr': 0.0004917989734617928, 'samples': 2707392, 'steps': 14100, 'loss/train': 1.9953140020370483} +11/06/2021 23:11:39 - INFO - __main__ - Step 14102: {'lr': 0.0004917976253260471, 'samples': 2707584, 'steps': 14101, 'loss/train': 1.6123121976852417} +11/06/2021 23:11:40 - INFO - __main__ - Step 14103: {'lr': 0.000491796277081351, 'samples': 2707776, 'steps': 14102, 'loss/train': 1.817934274673462} +11/06/2021 23:11:40 - INFO - __main__ - Step 14104: {'lr': 0.0004917949287277052, 'samples': 2707968, 'steps': 14103, 'loss/train': 2.0339081287384033} +11/06/2021 23:11:41 - INFO - __main__ - Step 14105: {'lr': 0.0004917935802651104, 'samples': 2708160, 'steps': 14104, 'loss/train': 1.8835687637329102} +11/06/2021 23:11:42 - INFO - __main__ - Step 14106: {'lr': 0.0004917922316935671, 'samples': 2708352, 'steps': 14105, 'loss/train': 1.9598747491836548} +11/06/2021 23:11:42 - INFO - __main__ - Step 14107: {'lr': 0.000491790883013076, 'samples': 2708544, 'steps': 14106, 'loss/train': 1.3012551069259644} +11/06/2021 23:11:42 - INFO - __main__ - Step 14108: {'lr': 0.0004917895342236377, 'samples': 2708736, 'steps': 14107, 'loss/train': 1.5593042373657227} +11/06/2021 23:11:43 - INFO - __main__ - Step 14109: {'lr': 0.0004917881853252527, 'samples': 2708928, 'steps': 14108, 'loss/train': 1.7348185777664185} +11/06/2021 23:11:44 - INFO - __main__ - Step 14110: {'lr': 0.0004917868363179216, 'samples': 2709120, 'steps': 14109, 'loss/train': 2.0034899711608887} +11/06/2021 23:11:44 - INFO - __main__ - Step 14111: {'lr': 0.0004917854872016451, 'samples': 2709312, 'steps': 14110, 'loss/train': 1.7014143466949463} +11/06/2021 23:11:44 - INFO - __main__ - Step 14112: {'lr': 0.000491784137976424, 'samples': 2709504, 'steps': 14111, 'loss/train': 0.5290675163269043} +11/06/2021 23:11:45 - INFO - __main__ - Step 14113: {'lr': 0.0004917827886422586, 'samples': 2709696, 'steps': 14112, 'loss/train': 1.854404330253601} +11/06/2021 23:11:45 - INFO - __main__ - Step 14114: {'lr': 0.0004917814391991494, 'samples': 2709888, 'steps': 14113, 'loss/train': 1.8280285596847534} +11/06/2021 23:11:46 - INFO - __main__ - Step 14115: {'lr': 0.0004917800896470974, 'samples': 2710080, 'steps': 14114, 'loss/train': 1.9659100770950317} +11/06/2021 23:11:46 - INFO - __main__ - Step 14116: {'lr': 0.000491778739986103, 'samples': 2710272, 'steps': 14115, 'loss/train': 2.029839515686035} +11/06/2021 23:11:47 - INFO - __main__ - Step 14117: {'lr': 0.0004917773902161669, 'samples': 2710464, 'steps': 14116, 'loss/train': 1.8698660135269165} +11/06/2021 23:11:47 - INFO - __main__ - Step 14118: {'lr': 0.0004917760403372895, 'samples': 2710656, 'steps': 14117, 'loss/train': 1.1892834901809692} +11/06/2021 23:11:47 - INFO - __main__ - Step 14119: {'lr': 0.0004917746903494717, 'samples': 2710848, 'steps': 14118, 'loss/train': 0.9476760029792786} +11/06/2021 23:11:48 - INFO - __main__ - Step 14120: {'lr': 0.0004917733402527138, 'samples': 2711040, 'steps': 14119, 'loss/train': 1.6532700061798096} +11/06/2021 23:11:49 - INFO - __main__ - Step 14121: {'lr': 0.0004917719900470167, 'samples': 2711232, 'steps': 14120, 'loss/train': 1.880062222480774} +11/06/2021 23:11:49 - INFO - __main__ - Step 14122: {'lr': 0.0004917706397323808, 'samples': 2711424, 'steps': 14121, 'loss/train': 2.203761100769043} +11/06/2021 23:11:49 - INFO - __main__ - Step 14123: {'lr': 0.0004917692893088067, 'samples': 2711616, 'steps': 14122, 'loss/train': 1.9275217056274414} +11/06/2021 23:11:50 - INFO - __main__ - Step 14124: {'lr': 0.0004917679387762952, 'samples': 2711808, 'steps': 14123, 'loss/train': 1.9265042543411255} +11/06/2021 23:11:51 - INFO - __main__ - Step 14125: {'lr': 0.0004917665881348467, 'samples': 2712000, 'steps': 14124, 'loss/train': 1.2948485612869263} +11/06/2021 23:11:51 - INFO - __main__ - Step 14126: {'lr': 0.000491765237384462, 'samples': 2712192, 'steps': 14125, 'loss/train': 1.6665414571762085} +11/06/2021 23:11:52 - INFO - __main__ - Step 14127: {'lr': 0.0004917638865251416, 'samples': 2712384, 'steps': 14126, 'loss/train': 0.629708468914032} +11/06/2021 23:11:52 - INFO - __main__ - Step 14128: {'lr': 0.0004917625355568861, 'samples': 2712576, 'steps': 14127, 'loss/train': 1.6347920894622803} +11/06/2021 23:11:53 - INFO - __main__ - Step 14129: {'lr': 0.0004917611844796962, 'samples': 2712768, 'steps': 14128, 'loss/train': 1.388734221458435} +11/06/2021 23:11:54 - INFO - __main__ - Step 14130: {'lr': 0.0004917598332935724, 'samples': 2712960, 'steps': 14129, 'loss/train': 1.3727388381958008} +11/06/2021 23:11:54 - INFO - __main__ - Step 14131: {'lr': 0.0004917584819985153, 'samples': 2713152, 'steps': 14130, 'loss/train': 1.5905683040618896} +11/06/2021 23:11:54 - INFO - __main__ - Step 14132: {'lr': 0.0004917571305945256, 'samples': 2713344, 'steps': 14131, 'loss/train': 1.9821319580078125} +11/06/2021 23:11:55 - INFO - __main__ - Step 14133: {'lr': 0.0004917557790816039, 'samples': 2713536, 'steps': 14132, 'loss/train': 1.3257533311843872} +11/06/2021 23:11:55 - INFO - __main__ - Step 14134: {'lr': 0.0004917544274597507, 'samples': 2713728, 'steps': 14133, 'loss/train': 1.8089780807495117} +11/06/2021 23:11:56 - INFO - __main__ - Step 14135: {'lr': 0.0004917530757289668, 'samples': 2713920, 'steps': 14134, 'loss/train': 1.6792985200881958} +11/06/2021 23:11:56 - INFO - __main__ - Step 14136: {'lr': 0.0004917517238892526, 'samples': 2714112, 'steps': 14135, 'loss/train': 1.4552292823791504} +11/06/2021 23:11:57 - INFO - __main__ - Step 14137: {'lr': 0.0004917503719406087, 'samples': 2714304, 'steps': 14136, 'loss/train': 1.8645858764648438} +11/06/2021 23:11:57 - INFO - __main__ - Step 14138: {'lr': 0.000491749019883036, 'samples': 2714496, 'steps': 14137, 'loss/train': 1.6772507429122925} +11/06/2021 23:11:58 - INFO - __main__ - Step 14139: {'lr': 0.0004917476677165349, 'samples': 2714688, 'steps': 14138, 'loss/train': 1.839224100112915} +11/06/2021 23:11:58 - INFO - __main__ - Step 14140: {'lr': 0.0004917463154411059, 'samples': 2714880, 'steps': 14139, 'loss/train': 1.2386482954025269} +11/06/2021 23:11:59 - INFO - __main__ - Step 14141: {'lr': 0.0004917449630567499, 'samples': 2715072, 'steps': 14140, 'loss/train': 1.9079393148422241} +11/06/2021 23:11:59 - INFO - __main__ - Step 14142: {'lr': 0.0004917436105634673, 'samples': 2715264, 'steps': 14141, 'loss/train': 1.7619988918304443} +11/06/2021 23:12:00 - INFO - __main__ - Step 14143: {'lr': 0.0004917422579612587, 'samples': 2715456, 'steps': 14142, 'loss/train': 1.625560998916626} +11/06/2021 23:12:00 - INFO - __main__ - Step 14144: {'lr': 0.0004917409052501248, 'samples': 2715648, 'steps': 14143, 'loss/train': 1.4624155759811401} +11/06/2021 23:12:00 - INFO - __main__ - Step 14145: {'lr': 0.0004917395524300661, 'samples': 2715840, 'steps': 14144, 'loss/train': 1.0638208389282227} +11/06/2021 23:12:02 - INFO - __main__ - Step 14146: {'lr': 0.0004917381995010834, 'samples': 2716032, 'steps': 14145, 'loss/train': 1.523756980895996} +11/06/2021 23:12:02 - INFO - __main__ - Step 14147: {'lr': 0.0004917368464631772, 'samples': 2716224, 'steps': 14146, 'loss/train': 1.4266034364700317} +11/06/2021 23:12:02 - INFO - __main__ - Step 14148: {'lr': 0.0004917354933163481, 'samples': 2716416, 'steps': 14147, 'loss/train': 2.06866455078125} +11/06/2021 23:12:03 - INFO - __main__ - Step 14149: {'lr': 0.0004917341400605967, 'samples': 2716608, 'steps': 14148, 'loss/train': 1.4128144979476929} +11/06/2021 23:12:03 - INFO - __main__ - Step 14150: {'lr': 0.0004917327866959236, 'samples': 2716800, 'steps': 14149, 'loss/train': 1.0061789751052856} +11/06/2021 23:12:04 - INFO - __main__ - Step 14151: {'lr': 0.0004917314332223295, 'samples': 2716992, 'steps': 14150, 'loss/train': 1.8678841590881348} +11/06/2021 23:12:04 - INFO - __main__ - Step 14152: {'lr': 0.0004917300796398148, 'samples': 2717184, 'steps': 14151, 'loss/train': 1.5144931077957153} +11/06/2021 23:12:05 - INFO - __main__ - Step 14153: {'lr': 0.0004917287259483805, 'samples': 2717376, 'steps': 14152, 'loss/train': 1.836294412612915} +11/06/2021 23:12:05 - INFO - __main__ - Step 14154: {'lr': 0.0004917273721480268, 'samples': 2717568, 'steps': 14153, 'loss/train': 1.3567187786102295} +11/06/2021 23:12:05 - INFO - __main__ - Step 14155: {'lr': 0.0004917260182387545, 'samples': 2717760, 'steps': 14154, 'loss/train': 1.4603012800216675} +11/06/2021 23:12:07 - INFO - __main__ - Step 14156: {'lr': 0.0004917246642205642, 'samples': 2717952, 'steps': 14155, 'loss/train': 1.4038804769515991} +11/06/2021 23:12:07 - INFO - __main__ - Step 14157: {'lr': 0.0004917233100934565, 'samples': 2718144, 'steps': 14156, 'loss/train': 1.8869411945343018} +11/06/2021 23:12:07 - INFO - __main__ - Step 14158: {'lr': 0.0004917219558574319, 'samples': 2718336, 'steps': 14157, 'loss/train': 1.7700613737106323} +11/06/2021 23:12:08 - INFO - __main__ - Step 14159: {'lr': 0.0004917206015124913, 'samples': 2718528, 'steps': 14158, 'loss/train': 0.9594613313674927} +11/06/2021 23:12:08 - INFO - __main__ - Step 14160: {'lr': 0.000491719247058635, 'samples': 2718720, 'steps': 14159, 'loss/train': 1.2669697999954224} +11/06/2021 23:12:08 - INFO - __main__ - Step 14161: {'lr': 0.0004917178924958638, 'samples': 2718912, 'steps': 14160, 'loss/train': 2.0762956142425537} +11/06/2021 23:12:09 - INFO - __main__ - Step 14162: {'lr': 0.0004917165378241782, 'samples': 2719104, 'steps': 14161, 'loss/train': 1.8425633907318115} +11/06/2021 23:12:10 - INFO - __main__ - Step 14163: {'lr': 0.0004917151830435789, 'samples': 2719296, 'steps': 14162, 'loss/train': 1.3636668920516968} +11/06/2021 23:12:10 - INFO - __main__ - Step 14164: {'lr': 0.0004917138281540664, 'samples': 2719488, 'steps': 14163, 'loss/train': 2.4625284671783447} +11/06/2021 23:12:10 - INFO - __main__ - Step 14165: {'lr': 0.0004917124731556415, 'samples': 2719680, 'steps': 14164, 'loss/train': 2.0274415016174316} +11/06/2021 23:12:11 - INFO - __main__ - Step 14166: {'lr': 0.0004917111180483046, 'samples': 2719872, 'steps': 14165, 'loss/train': 1.421899676322937} +11/06/2021 23:12:12 - INFO - __main__ - Step 14167: {'lr': 0.0004917097628320564, 'samples': 2720064, 'steps': 14166, 'loss/train': 1.8181909322738647} +11/06/2021 23:12:12 - INFO - __main__ - Step 14168: {'lr': 0.0004917084075068975, 'samples': 2720256, 'steps': 14167, 'loss/train': 1.8530933856964111} +11/06/2021 23:12:12 - INFO - __main__ - Step 14169: {'lr': 0.0004917070520728286, 'samples': 2720448, 'steps': 14168, 'loss/train': 1.7252720594406128} +11/06/2021 23:12:13 - INFO - __main__ - Step 14170: {'lr': 0.0004917056965298501, 'samples': 2720640, 'steps': 14169, 'loss/train': 1.3021842241287231} +11/06/2021 23:12:13 - INFO - __main__ - Step 14171: {'lr': 0.0004917043408779629, 'samples': 2720832, 'steps': 14170, 'loss/train': 1.746435523033142} +11/06/2021 23:12:14 - INFO - __main__ - Step 14172: {'lr': 0.0004917029851171674, 'samples': 2721024, 'steps': 14171, 'loss/train': 0.15152797102928162} +11/06/2021 23:12:15 - INFO - __main__ - Step 14173: {'lr': 0.0004917016292474642, 'samples': 2721216, 'steps': 14172, 'loss/train': 2.0078635215759277} +11/06/2021 23:12:15 - INFO - __main__ - Step 14174: {'lr': 0.000491700273268854, 'samples': 2721408, 'steps': 14173, 'loss/train': 1.525383472442627} +11/06/2021 23:12:15 - INFO - __main__ - Step 14175: {'lr': 0.0004916989171813374, 'samples': 2721600, 'steps': 14174, 'loss/train': 1.6893455982208252} +11/06/2021 23:12:16 - INFO - __main__ - Step 14176: {'lr': 0.000491697560984915, 'samples': 2721792, 'steps': 14175, 'loss/train': 1.4403749704360962} +11/06/2021 23:12:17 - INFO - __main__ - Step 14177: {'lr': 0.0004916962046795874, 'samples': 2721984, 'steps': 14176, 'loss/train': 2.55890154838562} +11/06/2021 23:12:17 - INFO - __main__ - Step 14178: {'lr': 0.0004916948482653553, 'samples': 2722176, 'steps': 14177, 'loss/train': 1.7743308544158936} +11/06/2021 23:12:17 - INFO - __main__ - Step 14179: {'lr': 0.0004916934917422191, 'samples': 2722368, 'steps': 14178, 'loss/train': 1.5195140838623047} +11/06/2021 23:12:18 - INFO - __main__ - Step 14180: {'lr': 0.0004916921351101796, 'samples': 2722560, 'steps': 14179, 'loss/train': 1.529984951019287} +11/06/2021 23:12:18 - INFO - __main__ - Step 14181: {'lr': 0.0004916907783692374, 'samples': 2722752, 'steps': 14180, 'loss/train': 1.9970260858535767} +11/06/2021 23:12:18 - INFO - __main__ - Step 14182: {'lr': 0.000491689421519393, 'samples': 2722944, 'steps': 14181, 'loss/train': 1.5570197105407715} +11/06/2021 23:12:19 - INFO - __main__ - Step 14183: {'lr': 0.0004916880645606471, 'samples': 2723136, 'steps': 14182, 'loss/train': 1.396638035774231} +11/06/2021 23:12:20 - INFO - __main__ - Step 14184: {'lr': 0.0004916867074930002, 'samples': 2723328, 'steps': 14183, 'loss/train': 1.960241436958313} +11/06/2021 23:12:20 - INFO - __main__ - Step 14185: {'lr': 0.0004916853503164531, 'samples': 2723520, 'steps': 14184, 'loss/train': 1.312820553779602} +11/06/2021 23:12:20 - INFO - __main__ - Step 14186: {'lr': 0.0004916839930310063, 'samples': 2723712, 'steps': 14185, 'loss/train': 1.5989493131637573} +11/06/2021 23:12:21 - INFO - __main__ - Step 14187: {'lr': 0.0004916826356366605, 'samples': 2723904, 'steps': 14186, 'loss/train': 2.3531341552734375} +11/06/2021 23:12:22 - INFO - __main__ - Step 14188: {'lr': 0.0004916812781334161, 'samples': 2724096, 'steps': 14187, 'loss/train': 1.5331050157546997} +11/06/2021 23:12:22 - INFO - __main__ - Step 14189: {'lr': 0.0004916799205212739, 'samples': 2724288, 'steps': 14188, 'loss/train': 1.6796480417251587} +11/06/2021 23:12:23 - INFO - __main__ - Step 14190: {'lr': 0.0004916785628002345, 'samples': 2724480, 'steps': 14189, 'loss/train': 1.338007926940918} +11/06/2021 23:12:23 - INFO - __main__ - Step 14191: {'lr': 0.0004916772049702984, 'samples': 2724672, 'steps': 14190, 'loss/train': 2.13338565826416} +11/06/2021 23:12:23 - INFO - __main__ - Step 14192: {'lr': 0.0004916758470314662, 'samples': 2724864, 'steps': 14191, 'loss/train': 1.8545008897781372} +11/06/2021 23:12:24 - INFO - __main__ - Step 14193: {'lr': 0.0004916744889837388, 'samples': 2725056, 'steps': 14192, 'loss/train': 1.7253385782241821} +11/06/2021 23:12:25 - INFO - __main__ - Step 14194: {'lr': 0.0004916731308271165, 'samples': 2725248, 'steps': 14193, 'loss/train': 1.8852863311767578} +11/06/2021 23:12:25 - INFO - __main__ - Step 14195: {'lr': 0.0004916717725616, 'samples': 2725440, 'steps': 14194, 'loss/train': 1.7347588539123535} +11/06/2021 23:12:25 - INFO - __main__ - Step 14196: {'lr': 0.0004916704141871899, 'samples': 2725632, 'steps': 14195, 'loss/train': 1.6380163431167603} +11/06/2021 23:12:26 - INFO - __main__ - Step 14197: {'lr': 0.000491669055703887, 'samples': 2725824, 'steps': 14196, 'loss/train': 1.5754060745239258} +11/06/2021 23:12:27 - INFO - __main__ - Step 14198: {'lr': 0.0004916676971116916, 'samples': 2726016, 'steps': 14197, 'loss/train': 1.435011863708496} +11/06/2021 23:12:27 - INFO - __main__ - Step 14199: {'lr': 0.0004916663384106045, 'samples': 2726208, 'steps': 14198, 'loss/train': 1.975164771080017} +11/06/2021 23:12:28 - INFO - __main__ - Step 14200: {'lr': 0.0004916649796006263, 'samples': 2726400, 'steps': 14199, 'loss/train': 1.1312105655670166} +11/06/2021 23:12:28 - INFO - __main__ - Step 14201: {'lr': 0.0004916636206817575, 'samples': 2726592, 'steps': 14200, 'loss/train': 1.805939793586731} +11/06/2021 23:12:28 - INFO - __main__ - Step 14202: {'lr': 0.0004916622616539988, 'samples': 2726784, 'steps': 14201, 'loss/train': 1.1680221557617188} +11/06/2021 23:12:29 - INFO - __main__ - Step 14203: {'lr': 0.000491660902517351, 'samples': 2726976, 'steps': 14202, 'loss/train': 1.5965232849121094} +11/06/2021 23:12:30 - INFO - __main__ - Step 14204: {'lr': 0.0004916595432718143, 'samples': 2727168, 'steps': 14203, 'loss/train': 1.660688877105713} +11/06/2021 23:12:30 - INFO - __main__ - Step 14205: {'lr': 0.0004916581839173897, 'samples': 2727360, 'steps': 14204, 'loss/train': 2.3039207458496094} +11/06/2021 23:12:31 - INFO - __main__ - Step 14206: {'lr': 0.0004916568244540776, 'samples': 2727552, 'steps': 14205, 'loss/train': 1.4516968727111816} +11/06/2021 23:12:31 - INFO - __main__ - Step 14207: {'lr': 0.0004916554648818787, 'samples': 2727744, 'steps': 14206, 'loss/train': 1.7223396301269531} +11/06/2021 23:12:31 - INFO - __main__ - Step 14208: {'lr': 0.0004916541052007936, 'samples': 2727936, 'steps': 14207, 'loss/train': 1.0482618808746338} +11/06/2021 23:12:32 - INFO - __main__ - Step 14209: {'lr': 0.0004916527454108227, 'samples': 2728128, 'steps': 14208, 'loss/train': 1.7698308229446411} +11/06/2021 23:12:33 - INFO - __main__ - Step 14210: {'lr': 0.0004916513855119669, 'samples': 2728320, 'steps': 14209, 'loss/train': 2.295707941055298} +11/06/2021 23:12:33 - INFO - __main__ - Step 14211: {'lr': 0.0004916500255042268, 'samples': 2728512, 'steps': 14210, 'loss/train': 1.637235164642334} +11/06/2021 23:12:33 - INFO - __main__ - Step 14212: {'lr': 0.0004916486653876029, 'samples': 2728704, 'steps': 14211, 'loss/train': 1.552703619003296} +11/06/2021 23:12:34 - INFO - __main__ - Step 14213: {'lr': 0.0004916473051620958, 'samples': 2728896, 'steps': 14212, 'loss/train': 2.0507657527923584} +11/06/2021 23:12:35 - INFO - __main__ - Step 14214: {'lr': 0.0004916459448277062, 'samples': 2729088, 'steps': 14213, 'loss/train': 2.118166446685791} +11/06/2021 23:12:35 - INFO - __main__ - Step 14215: {'lr': 0.0004916445843844346, 'samples': 2729280, 'steps': 14214, 'loss/train': 1.8859989643096924} +11/06/2021 23:12:36 - INFO - __main__ - Step 14216: {'lr': 0.0004916432238322818, 'samples': 2729472, 'steps': 14215, 'loss/train': 1.5724775791168213} +11/06/2021 23:12:36 - INFO - __main__ - Step 14217: {'lr': 0.0004916418631712481, 'samples': 2729664, 'steps': 14216, 'loss/train': 1.3125375509262085} +11/06/2021 23:12:36 - INFO - __main__ - Step 14218: {'lr': 0.0004916405024013344, 'samples': 2729856, 'steps': 14217, 'loss/train': 1.8595951795578003} +11/06/2021 23:12:37 - INFO - __main__ - Step 14219: {'lr': 0.0004916391415225413, 'samples': 2730048, 'steps': 14218, 'loss/train': 1.1561071872711182} +11/06/2021 23:12:38 - INFO - __main__ - Step 14220: {'lr': 0.0004916377805348692, 'samples': 2730240, 'steps': 14219, 'loss/train': 1.8915315866470337} +11/06/2021 23:12:38 - INFO - __main__ - Step 14221: {'lr': 0.000491636419438319, 'samples': 2730432, 'steps': 14220, 'loss/train': 1.322358250617981} +11/06/2021 23:12:38 - INFO - __main__ - Step 14222: {'lr': 0.000491635058232891, 'samples': 2730624, 'steps': 14221, 'loss/train': 1.5473992824554443} +11/06/2021 23:12:39 - INFO - __main__ - Step 14223: {'lr': 0.0004916336969185861, 'samples': 2730816, 'steps': 14222, 'loss/train': 0.6478114724159241} +11/06/2021 23:12:40 - INFO - __main__ - Step 14224: {'lr': 0.0004916323354954047, 'samples': 2731008, 'steps': 14223, 'loss/train': 1.2803329229354858} +11/06/2021 23:12:40 - INFO - __main__ - Step 14225: {'lr': 0.0004916309739633475, 'samples': 2731200, 'steps': 14224, 'loss/train': 1.5547466278076172} +11/06/2021 23:12:40 - INFO - __main__ - Step 14226: {'lr': 0.0004916296123224151, 'samples': 2731392, 'steps': 14225, 'loss/train': 2.0657129287719727} +11/06/2021 23:12:41 - INFO - __main__ - Step 14227: {'lr': 0.0004916282505726082, 'samples': 2731584, 'steps': 14226, 'loss/train': 1.7537693977355957} +11/06/2021 23:12:41 - INFO - __main__ - Step 14228: {'lr': 0.0004916268887139272, 'samples': 2731776, 'steps': 14227, 'loss/train': 1.8315138816833496} +11/06/2021 23:12:42 - INFO - __main__ - Step 14229: {'lr': 0.000491625526746373, 'samples': 2731968, 'steps': 14228, 'loss/train': 2.130446434020996} +11/06/2021 23:12:43 - INFO - __main__ - Step 14230: {'lr': 0.000491624164669946, 'samples': 2732160, 'steps': 14229, 'loss/train': 2.0926835536956787} +11/06/2021 23:12:43 - INFO - __main__ - Step 14231: {'lr': 0.0004916228024846469, 'samples': 2732352, 'steps': 14230, 'loss/train': 1.9206883907318115} +11/06/2021 23:12:43 - INFO - __main__ - Step 14232: {'lr': 0.0004916214401904763, 'samples': 2732544, 'steps': 14231, 'loss/train': 1.461196780204773} +11/06/2021 23:12:44 - INFO - __main__ - Step 14233: {'lr': 0.0004916200777874348, 'samples': 2732736, 'steps': 14232, 'loss/train': 1.8770463466644287} +11/06/2021 23:12:45 - INFO - __main__ - Step 14234: {'lr': 0.000491618715275523, 'samples': 2732928, 'steps': 14233, 'loss/train': 2.0279908180236816} +11/06/2021 23:12:46 - INFO - __main__ - Step 14235: {'lr': 0.0004916173526547415, 'samples': 2733120, 'steps': 14234, 'loss/train': 1.2167682647705078} +11/06/2021 23:12:46 - INFO - __main__ - Step 14236: {'lr': 0.000491615989925091, 'samples': 2733312, 'steps': 14235, 'loss/train': 1.5853732824325562} +11/06/2021 23:12:46 - INFO - __main__ - Step 14237: {'lr': 0.0004916146270865721, 'samples': 2733504, 'steps': 14236, 'loss/train': 2.5321567058563232} +11/06/2021 23:12:47 - INFO - __main__ - Step 14238: {'lr': 0.0004916132641391854, 'samples': 2733696, 'steps': 14237, 'loss/train': 1.8508648872375488} +11/06/2021 23:12:47 - INFO - __main__ - Step 14239: {'lr': 0.0004916119010829314, 'samples': 2733888, 'steps': 14238, 'loss/train': 1.860944390296936} +11/06/2021 23:12:47 - INFO - __main__ - Step 14240: {'lr': 0.0004916105379178108, 'samples': 2734080, 'steps': 14239, 'loss/train': 1.910184621810913} +11/06/2021 23:12:48 - INFO - __main__ - Step 14241: {'lr': 0.0004916091746438243, 'samples': 2734272, 'steps': 14240, 'loss/train': 1.9223930835723877} +11/06/2021 23:12:49 - INFO - __main__ - Step 14242: {'lr': 0.0004916078112609724, 'samples': 2734464, 'steps': 14241, 'loss/train': 1.7084510326385498} +11/06/2021 23:12:49 - INFO - __main__ - Step 14243: {'lr': 0.0004916064477692557, 'samples': 2734656, 'steps': 14242, 'loss/train': 0.43883585929870605} +11/06/2021 23:12:49 - INFO - __main__ - Step 14244: {'lr': 0.0004916050841686748, 'samples': 2734848, 'steps': 14243, 'loss/train': 1.6944113969802856} +11/06/2021 23:12:50 - INFO - __main__ - Step 14245: {'lr': 0.0004916037204592306, 'samples': 2735040, 'steps': 14244, 'loss/train': 1.1687214374542236} +11/06/2021 23:12:51 - INFO - __main__ - Step 14246: {'lr': 0.0004916023566409233, 'samples': 2735232, 'steps': 14245, 'loss/train': 2.218296766281128} +11/06/2021 23:12:51 - INFO - __main__ - Step 14247: {'lr': 0.0004916009927137538, 'samples': 2735424, 'steps': 14246, 'loss/train': 1.7040735483169556} +11/06/2021 23:12:52 - INFO - __main__ - Step 14248: {'lr': 0.0004915996286777226, 'samples': 2735616, 'steps': 14247, 'loss/train': 1.2565326690673828} +11/06/2021 23:12:52 - INFO - __main__ - Step 14249: {'lr': 0.0004915982645328304, 'samples': 2735808, 'steps': 14248, 'loss/train': 1.6930842399597168} +11/06/2021 23:12:52 - INFO - __main__ - Step 14250: {'lr': 0.0004915969002790777, 'samples': 2736000, 'steps': 14249, 'loss/train': 1.771859049797058} +11/06/2021 23:12:53 - INFO - __main__ - Step 14251: {'lr': 0.0004915955359164651, 'samples': 2736192, 'steps': 14250, 'loss/train': 1.4663689136505127} +11/06/2021 23:12:54 - INFO - __main__ - Step 14252: {'lr': 0.0004915941714449933, 'samples': 2736384, 'steps': 14251, 'loss/train': 1.6903026103973389} +11/06/2021 23:12:54 - INFO - __main__ - Step 14253: {'lr': 0.000491592806864663, 'samples': 2736576, 'steps': 14252, 'loss/train': 1.7190121412277222} +11/06/2021 23:12:54 - INFO - __main__ - Step 14254: {'lr': 0.0004915914421754746, 'samples': 2736768, 'steps': 14253, 'loss/train': 0.6711317300796509} +11/06/2021 23:12:55 - INFO - __main__ - Step 14255: {'lr': 0.0004915900773774289, 'samples': 2736960, 'steps': 14254, 'loss/train': 1.9526695013046265} +11/06/2021 23:12:55 - INFO - __main__ - Step 14256: {'lr': 0.0004915887124705263, 'samples': 2737152, 'steps': 14255, 'loss/train': 2.055246353149414} +11/06/2021 23:12:56 - INFO - __main__ - Step 14257: {'lr': 0.0004915873474547677, 'samples': 2737344, 'steps': 14256, 'loss/train': 1.7780791521072388} +11/06/2021 23:12:57 - INFO - __main__ - Step 14258: {'lr': 0.0004915859823301535, 'samples': 2737536, 'steps': 14257, 'loss/train': 1.91822350025177} +11/06/2021 23:12:57 - INFO - __main__ - Step 14259: {'lr': 0.0004915846170966845, 'samples': 2737728, 'steps': 14258, 'loss/train': 1.2504817247390747} +11/06/2021 23:12:57 - INFO - __main__ - Step 14260: {'lr': 0.000491583251754361, 'samples': 2737920, 'steps': 14259, 'loss/train': 2.1529762744903564} +11/06/2021 23:12:58 - INFO - __main__ - Step 14261: {'lr': 0.0004915818863031839, 'samples': 2738112, 'steps': 14260, 'loss/train': 2.2141220569610596} +11/06/2021 23:12:58 - INFO - __main__ - Step 14262: {'lr': 0.0004915805207431537, 'samples': 2738304, 'steps': 14261, 'loss/train': 1.4041943550109863} +11/06/2021 23:12:59 - INFO - __main__ - Step 14263: {'lr': 0.0004915791550742712, 'samples': 2738496, 'steps': 14262, 'loss/train': 2.012119770050049} +11/06/2021 23:12:59 - INFO - __main__ - Step 14264: {'lr': 0.0004915777892965368, 'samples': 2738688, 'steps': 14263, 'loss/train': 1.8272478580474854} +11/06/2021 23:13:00 - INFO - __main__ - Step 14265: {'lr': 0.0004915764234099511, 'samples': 2738880, 'steps': 14264, 'loss/train': 1.6100664138793945} +11/06/2021 23:13:00 - INFO - __main__ - Step 14266: {'lr': 0.0004915750574145148, 'samples': 2739072, 'steps': 14265, 'loss/train': 1.9792180061340332} +11/06/2021 23:13:00 - INFO - __main__ - Step 14267: {'lr': 0.0004915736913102285, 'samples': 2739264, 'steps': 14266, 'loss/train': 1.8761942386627197} +11/06/2021 23:13:02 - INFO - __main__ - Step 14268: {'lr': 0.0004915723250970928, 'samples': 2739456, 'steps': 14267, 'loss/train': 2.067959785461426} +11/06/2021 23:13:02 - INFO - __main__ - Step 14269: {'lr': 0.0004915709587751084, 'samples': 2739648, 'steps': 14268, 'loss/train': 2.4542698860168457} +11/06/2021 23:13:02 - INFO - __main__ - Step 14270: {'lr': 0.0004915695923442759, 'samples': 2739840, 'steps': 14269, 'loss/train': 1.489783763885498} +11/06/2021 23:13:03 - INFO - __main__ - Step 14271: {'lr': 0.0004915682258045958, 'samples': 2740032, 'steps': 14270, 'loss/train': 1.8175733089447021} +11/06/2021 23:13:03 - INFO - __main__ - Step 14272: {'lr': 0.0004915668591560688, 'samples': 2740224, 'steps': 14271, 'loss/train': 1.3902310132980347} +11/06/2021 23:13:04 - INFO - __main__ - Step 14273: {'lr': 0.0004915654923986955, 'samples': 2740416, 'steps': 14272, 'loss/train': 1.5795223712921143} +11/06/2021 23:13:04 - INFO - __main__ - Step 14274: {'lr': 0.0004915641255324764, 'samples': 2740608, 'steps': 14273, 'loss/train': 1.8649059534072876} +11/06/2021 23:13:05 - INFO - __main__ - Step 14275: {'lr': 0.0004915627585574124, 'samples': 2740800, 'steps': 14274, 'loss/train': 1.643608570098877} +11/06/2021 23:13:05 - INFO - __main__ - Step 14276: {'lr': 0.0004915613914735038, 'samples': 2740992, 'steps': 14275, 'loss/train': 2.0051262378692627} +11/06/2021 23:13:05 - INFO - __main__ - Step 14277: {'lr': 0.0004915600242807516, 'samples': 2741184, 'steps': 14276, 'loss/train': 1.455479383468628} +11/06/2021 23:13:06 - INFO - __main__ - Step 14278: {'lr': 0.000491558656979156, 'samples': 2741376, 'steps': 14277, 'loss/train': 1.6889221668243408} +11/06/2021 23:13:07 - INFO - __main__ - Step 14279: {'lr': 0.0004915572895687179, 'samples': 2741568, 'steps': 14278, 'loss/train': 1.9221125841140747} +11/06/2021 23:13:07 - INFO - __main__ - Step 14280: {'lr': 0.0004915559220494376, 'samples': 2741760, 'steps': 14279, 'loss/train': 1.842481017112732} +11/06/2021 23:13:07 - INFO - __main__ - Step 14281: {'lr': 0.0004915545544213161, 'samples': 2741952, 'steps': 14280, 'loss/train': 1.5338388681411743} +11/06/2021 23:13:08 - INFO - __main__ - Step 14282: {'lr': 0.0004915531866843539, 'samples': 2742144, 'steps': 14281, 'loss/train': 1.903611660003662} +11/06/2021 23:13:09 - INFO - __main__ - Step 14283: {'lr': 0.0004915518188385514, 'samples': 2742336, 'steps': 14282, 'loss/train': 1.557709813117981} +11/06/2021 23:13:09 - INFO - __main__ - Step 14284: {'lr': 0.0004915504508839095, 'samples': 2742528, 'steps': 14283, 'loss/train': 1.7310574054718018} +11/06/2021 23:13:09 - INFO - __main__ - Step 14285: {'lr': 0.0004915490828204287, 'samples': 2742720, 'steps': 14284, 'loss/train': 1.8797122240066528} +11/06/2021 23:13:10 - INFO - __main__ - Step 14286: {'lr': 0.0004915477146481095, 'samples': 2742912, 'steps': 14285, 'loss/train': 1.9240556955337524} +11/06/2021 23:13:10 - INFO - __main__ - Step 14287: {'lr': 0.0004915463463669527, 'samples': 2743104, 'steps': 14286, 'loss/train': 2.307543992996216} +11/06/2021 23:13:11 - INFO - __main__ - Step 14288: {'lr': 0.0004915449779769589, 'samples': 2743296, 'steps': 14287, 'loss/train': 2.076409339904785} +11/06/2021 23:13:12 - INFO - __main__ - Step 14289: {'lr': 0.0004915436094781285, 'samples': 2743488, 'steps': 14288, 'loss/train': 1.6683952808380127} +11/06/2021 23:13:12 - INFO - __main__ - Step 14290: {'lr': 0.0004915422408704624, 'samples': 2743680, 'steps': 14289, 'loss/train': 1.3777574300765991} +11/06/2021 23:13:12 - INFO - __main__ - Step 14291: {'lr': 0.0004915408721539612, 'samples': 2743872, 'steps': 14290, 'loss/train': 1.556388020515442} +11/06/2021 23:13:13 - INFO - __main__ - Step 14292: {'lr': 0.0004915395033286251, 'samples': 2744064, 'steps': 14291, 'loss/train': 1.8184715509414673} +11/06/2021 23:13:13 - INFO - __main__ - Step 14293: {'lr': 0.0004915381343944552, 'samples': 2744256, 'steps': 14292, 'loss/train': 1.5744520425796509} +11/06/2021 23:13:14 - INFO - __main__ - Step 14294: {'lr': 0.0004915367653514521, 'samples': 2744448, 'steps': 14293, 'loss/train': 1.5268954038619995} +11/06/2021 23:13:14 - INFO - __main__ - Step 14295: {'lr': 0.0004915353961996161, 'samples': 2744640, 'steps': 14294, 'loss/train': 1.4393970966339111} +11/06/2021 23:13:15 - INFO - __main__ - Step 14296: {'lr': 0.000491534026938948, 'samples': 2744832, 'steps': 14295, 'loss/train': 1.8665683269500732} +11/06/2021 23:13:15 - INFO - __main__ - Step 14297: {'lr': 0.0004915326575694484, 'samples': 2745024, 'steps': 14296, 'loss/train': 2.0807924270629883} +11/06/2021 23:13:15 - INFO - __main__ - Step 14298: {'lr': 0.0004915312880911178, 'samples': 2745216, 'steps': 14297, 'loss/train': 1.800079345703125} +11/06/2021 23:13:16 - INFO - __main__ - Step 14299: {'lr': 0.000491529918503957, 'samples': 2745408, 'steps': 14298, 'loss/train': 1.6191036701202393} +11/06/2021 23:13:17 - INFO - __main__ - Step 14300: {'lr': 0.0004915285488079666, 'samples': 2745600, 'steps': 14299, 'loss/train': 1.6357394456863403} +11/06/2021 23:13:17 - INFO - __main__ - Step 14301: {'lr': 0.0004915271790031471, 'samples': 2745792, 'steps': 14300, 'loss/train': 1.8493192195892334} +11/06/2021 23:13:17 - INFO - __main__ - Step 14302: {'lr': 0.0004915258090894993, 'samples': 2745984, 'steps': 14301, 'loss/train': 1.3855708837509155} +11/06/2021 23:13:18 - INFO - __main__ - Step 14303: {'lr': 0.0004915244390670236, 'samples': 2746176, 'steps': 14302, 'loss/train': 1.6835711002349854} +11/06/2021 23:13:19 - INFO - __main__ - Step 14304: {'lr': 0.0004915230689357206, 'samples': 2746368, 'steps': 14303, 'loss/train': 1.9127839803695679} +11/06/2021 23:13:19 - INFO - __main__ - Step 14305: {'lr': 0.0004915216986955913, 'samples': 2746560, 'steps': 14304, 'loss/train': 1.7443958520889282} +11/06/2021 23:13:19 - INFO - __main__ - Step 14306: {'lr': 0.0004915203283466359, 'samples': 2746752, 'steps': 14305, 'loss/train': 1.8569912910461426} +11/06/2021 23:13:20 - INFO - __main__ - Step 14307: {'lr': 0.0004915189578888552, 'samples': 2746944, 'steps': 14306, 'loss/train': 2.002859354019165} +11/06/2021 23:13:20 - INFO - __main__ - Step 14308: {'lr': 0.0004915175873222497, 'samples': 2747136, 'steps': 14307, 'loss/train': 1.7802067995071411} +11/06/2021 23:13:21 - INFO - __main__ - Step 14309: {'lr': 0.0004915162166468201, 'samples': 2747328, 'steps': 14308, 'loss/train': 1.61421799659729} +11/06/2021 23:13:22 - INFO - __main__ - Step 14310: {'lr': 0.0004915148458625671, 'samples': 2747520, 'steps': 14309, 'loss/train': 1.5801818370819092} +11/06/2021 23:13:22 - INFO - __main__ - Step 14311: {'lr': 0.0004915134749694912, 'samples': 2747712, 'steps': 14310, 'loss/train': 1.24630606174469} +11/06/2021 23:13:22 - INFO - __main__ - Step 14312: {'lr': 0.000491512103967593, 'samples': 2747904, 'steps': 14311, 'loss/train': 1.8175888061523438} +11/06/2021 23:13:23 - INFO - __main__ - Step 14313: {'lr': 0.0004915107328568733, 'samples': 2748096, 'steps': 14312, 'loss/train': 1.7059366703033447} +11/06/2021 23:13:23 - INFO - __main__ - Step 14314: {'lr': 0.0004915093616373326, 'samples': 2748288, 'steps': 14313, 'loss/train': 1.2261815071105957} +11/06/2021 23:13:24 - INFO - __main__ - Step 14315: {'lr': 0.0004915079903089714, 'samples': 2748480, 'steps': 14314, 'loss/train': 1.8357681035995483} +11/06/2021 23:13:24 - INFO - __main__ - Step 14316: {'lr': 0.0004915066188717905, 'samples': 2748672, 'steps': 14315, 'loss/train': 1.671004056930542} +11/06/2021 23:13:25 - INFO - __main__ - Step 14317: {'lr': 0.0004915052473257904, 'samples': 2748864, 'steps': 14316, 'loss/train': 1.6903188228607178} +11/06/2021 23:13:25 - INFO - __main__ - Step 14318: {'lr': 0.0004915038756709717, 'samples': 2749056, 'steps': 14317, 'loss/train': 1.4683510065078735} +11/06/2021 23:13:25 - INFO - __main__ - Step 14319: {'lr': 0.0004915025039073352, 'samples': 2749248, 'steps': 14318, 'loss/train': 1.8368884325027466} +11/06/2021 23:13:26 - INFO - __main__ - Step 14320: {'lr': 0.0004915011320348814, 'samples': 2749440, 'steps': 14319, 'loss/train': 1.3511337041854858} +11/06/2021 23:13:27 - INFO - __main__ - Step 14321: {'lr': 0.0004914997600536108, 'samples': 2749632, 'steps': 14320, 'loss/train': 1.4233803749084473} +11/06/2021 23:13:27 - INFO - __main__ - Step 14322: {'lr': 0.0004914983879635242, 'samples': 2749824, 'steps': 14321, 'loss/train': 1.6688144207000732} +11/06/2021 23:13:28 - INFO - __main__ - Step 14323: {'lr': 0.0004914970157646222, 'samples': 2750016, 'steps': 14322, 'loss/train': 1.5857484340667725} +11/06/2021 23:13:28 - INFO - __main__ - Step 14324: {'lr': 0.0004914956434569054, 'samples': 2750208, 'steps': 14323, 'loss/train': 1.8138678073883057} +11/06/2021 23:13:29 - INFO - __main__ - Step 14325: {'lr': 0.0004914942710403743, 'samples': 2750400, 'steps': 14324, 'loss/train': 2.092402935028076} +11/06/2021 23:13:29 - INFO - __main__ - Step 14326: {'lr': 0.0004914928985150296, 'samples': 2750592, 'steps': 14325, 'loss/train': 1.820569396018982} +11/06/2021 23:13:30 - INFO - __main__ - Step 14327: {'lr': 0.0004914915258808719, 'samples': 2750784, 'steps': 14326, 'loss/train': 1.4420838356018066} +11/06/2021 23:13:30 - INFO - __main__ - Step 14328: {'lr': 0.0004914901531379019, 'samples': 2750976, 'steps': 14327, 'loss/train': 1.843706727027893} +11/06/2021 23:13:30 - INFO - __main__ - Step 14329: {'lr': 0.0004914887802861201, 'samples': 2751168, 'steps': 14328, 'loss/train': 1.7319104671478271} +11/06/2021 23:13:32 - INFO - __main__ - Step 14330: {'lr': 0.0004914874073255273, 'samples': 2751360, 'steps': 14329, 'loss/train': 1.3918893337249756} +11/06/2021 23:13:32 - INFO - __main__ - Step 14331: {'lr': 0.0004914860342561239, 'samples': 2751552, 'steps': 14330, 'loss/train': 1.587130069732666} +11/06/2021 23:13:32 - INFO - __main__ - Step 14332: {'lr': 0.0004914846610779107, 'samples': 2751744, 'steps': 14331, 'loss/train': 1.7063366174697876} +11/06/2021 23:13:33 - INFO - __main__ - Step 14333: {'lr': 0.0004914832877908881, 'samples': 2751936, 'steps': 14332, 'loss/train': 1.7004281282424927} +11/06/2021 23:13:33 - INFO - __main__ - Step 14334: {'lr': 0.0004914819143950571, 'samples': 2752128, 'steps': 14333, 'loss/train': 1.0245263576507568} +11/06/2021 23:13:33 - INFO - __main__ - Step 14335: {'lr': 0.0004914805408904179, 'samples': 2752320, 'steps': 14334, 'loss/train': 1.9465148448944092} +11/06/2021 23:13:34 - INFO - __main__ - Step 14336: {'lr': 0.0004914791672769713, 'samples': 2752512, 'steps': 14335, 'loss/train': 1.6169592142105103} +11/06/2021 23:13:35 - INFO - __main__ - Step 14337: {'lr': 0.000491477793554718, 'samples': 2752704, 'steps': 14336, 'loss/train': 1.842124342918396} +11/06/2021 23:13:35 - INFO - __main__ - Step 14338: {'lr': 0.0004914764197236584, 'samples': 2752896, 'steps': 14337, 'loss/train': 2.156404495239258} +11/06/2021 23:13:35 - INFO - __main__ - Step 14339: {'lr': 0.0004914750457837933, 'samples': 2753088, 'steps': 14338, 'loss/train': 2.6054229736328125} +11/06/2021 23:13:36 - INFO - __main__ - Step 14340: {'lr': 0.0004914736717351233, 'samples': 2753280, 'steps': 14339, 'loss/train': 0.8791477084159851} +11/06/2021 23:13:37 - INFO - __main__ - Step 14341: {'lr': 0.000491472297577649, 'samples': 2753472, 'steps': 14340, 'loss/train': 2.0689876079559326} +11/06/2021 23:13:37 - INFO - __main__ - Step 14342: {'lr': 0.000491470923311371, 'samples': 2753664, 'steps': 14341, 'loss/train': 2.8645334243774414} +11/06/2021 23:13:38 - INFO - __main__ - Step 14343: {'lr': 0.0004914695489362899, 'samples': 2753856, 'steps': 14342, 'loss/train': 1.755697250366211} +11/06/2021 23:13:38 - INFO - __main__ - Step 14344: {'lr': 0.0004914681744524064, 'samples': 2754048, 'steps': 14343, 'loss/train': 1.9771595001220703} +11/06/2021 23:13:38 - INFO - __main__ - Step 14345: {'lr': 0.0004914667998597211, 'samples': 2754240, 'steps': 14344, 'loss/train': 1.9034637212753296} +11/06/2021 23:13:39 - INFO - __main__ - Step 14346: {'lr': 0.0004914654251582344, 'samples': 2754432, 'steps': 14345, 'loss/train': 2.0097978115081787} +11/06/2021 23:13:40 - INFO - __main__ - Step 14347: {'lr': 0.0004914640503479473, 'samples': 2754624, 'steps': 14346, 'loss/train': 1.8135510683059692} +11/06/2021 23:13:40 - INFO - __main__ - Step 14348: {'lr': 0.0004914626754288601, 'samples': 2754816, 'steps': 14347, 'loss/train': 2.062073230743408} +11/06/2021 23:13:40 - INFO - __main__ - Step 14349: {'lr': 0.0004914613004009736, 'samples': 2755008, 'steps': 14348, 'loss/train': 1.3072386980056763} +11/06/2021 23:13:41 - INFO - __main__ - Step 14350: {'lr': 0.0004914599252642884, 'samples': 2755200, 'steps': 14349, 'loss/train': 1.7098357677459717} +11/06/2021 23:13:41 - INFO - __main__ - Step 14351: {'lr': 0.000491458550018805, 'samples': 2755392, 'steps': 14350, 'loss/train': 1.7779287099838257} +11/06/2021 23:13:42 - INFO - __main__ - Step 14352: {'lr': 0.0004914571746645242, 'samples': 2755584, 'steps': 14351, 'loss/train': 2.2135913372039795} +11/06/2021 23:13:43 - INFO - __main__ - Step 14353: {'lr': 0.0004914557992014465, 'samples': 2755776, 'steps': 14352, 'loss/train': 1.0863014459609985} +11/06/2021 23:13:43 - INFO - __main__ - Step 14354: {'lr': 0.0004914544236295725, 'samples': 2755968, 'steps': 14353, 'loss/train': 1.349368691444397} +11/06/2021 23:13:43 - INFO - __main__ - Step 14355: {'lr': 0.0004914530479489029, 'samples': 2756160, 'steps': 14354, 'loss/train': 1.2938106060028076} +11/06/2021 23:13:44 - INFO - __main__ - Step 14356: {'lr': 0.0004914516721594382, 'samples': 2756352, 'steps': 14355, 'loss/train': 1.8118442296981812} +11/06/2021 23:13:45 - INFO - __main__ - Step 14357: {'lr': 0.0004914502962611792, 'samples': 2756544, 'steps': 14356, 'loss/train': 1.9531524181365967} +11/06/2021 23:13:45 - INFO - __main__ - Step 14358: {'lr': 0.0004914489202541264, 'samples': 2756736, 'steps': 14357, 'loss/train': 1.827507734298706} +11/06/2021 23:13:45 - INFO - __main__ - Step 14359: {'lr': 0.0004914475441382804, 'samples': 2756928, 'steps': 14358, 'loss/train': 1.6210410594940186} +11/06/2021 23:13:46 - INFO - __main__ - Step 14360: {'lr': 0.0004914461679136419, 'samples': 2757120, 'steps': 14359, 'loss/train': 1.5644958019256592} +11/06/2021 23:13:46 - INFO - __main__ - Step 14361: {'lr': 0.0004914447915802115, 'samples': 2757312, 'steps': 14360, 'loss/train': 1.3498966693878174} +11/06/2021 23:13:47 - INFO - __main__ - Step 14362: {'lr': 0.0004914434151379898, 'samples': 2757504, 'steps': 14361, 'loss/train': 1.2043393850326538} +11/06/2021 23:13:47 - INFO - __main__ - Step 14363: {'lr': 0.0004914420385869773, 'samples': 2757696, 'steps': 14362, 'loss/train': 1.314516544342041} +11/06/2021 23:13:48 - INFO - __main__ - Step 14364: {'lr': 0.0004914406619271749, 'samples': 2757888, 'steps': 14363, 'loss/train': 1.803429126739502} +11/06/2021 23:13:48 - INFO - __main__ - Step 14365: {'lr': 0.0004914392851585829, 'samples': 2758080, 'steps': 14364, 'loss/train': 1.7351176738739014} +11/06/2021 23:13:48 - INFO - __main__ - Step 14366: {'lr': 0.0004914379082812023, 'samples': 2758272, 'steps': 14365, 'loss/train': 1.1345579624176025} +11/06/2021 23:13:49 - INFO - __main__ - Step 14367: {'lr': 0.0004914365312950333, 'samples': 2758464, 'steps': 14366, 'loss/train': 2.234651803970337} +11/06/2021 23:13:50 - INFO - __main__ - Step 14368: {'lr': 0.0004914351542000768, 'samples': 2758656, 'steps': 14367, 'loss/train': 1.3707553148269653} +11/06/2021 23:13:50 - INFO - __main__ - Step 14369: {'lr': 0.0004914337769963334, 'samples': 2758848, 'steps': 14368, 'loss/train': 1.8129569292068481} +11/06/2021 23:13:51 - INFO - __main__ - Step 14370: {'lr': 0.0004914323996838036, 'samples': 2759040, 'steps': 14369, 'loss/train': 1.368338942527771} +11/06/2021 23:13:51 - INFO - __main__ - Step 14371: {'lr': 0.0004914310222624881, 'samples': 2759232, 'steps': 14370, 'loss/train': 1.6486504077911377} +11/06/2021 23:13:51 - INFO - __main__ - Step 14372: {'lr': 0.0004914296447323875, 'samples': 2759424, 'steps': 14371, 'loss/train': 1.776429295539856} +11/06/2021 23:13:52 - INFO - __main__ - Step 14373: {'lr': 0.0004914282670935025, 'samples': 2759616, 'steps': 14372, 'loss/train': 1.8240113258361816} +11/06/2021 23:13:53 - INFO - __main__ - Step 14374: {'lr': 0.0004914268893458336, 'samples': 2759808, 'steps': 14373, 'loss/train': 1.7623484134674072} +11/06/2021 23:13:53 - INFO - __main__ - Step 14375: {'lr': 0.0004914255114893814, 'samples': 2760000, 'steps': 14374, 'loss/train': 1.851312518119812} +11/06/2021 23:13:53 - INFO - __main__ - Step 14376: {'lr': 0.0004914241335241467, 'samples': 2760192, 'steps': 14375, 'loss/train': 1.748906135559082} +11/06/2021 23:13:54 - INFO - __main__ - Step 14377: {'lr': 0.0004914227554501299, 'samples': 2760384, 'steps': 14376, 'loss/train': 0.8111178278923035} +11/06/2021 23:13:55 - INFO - __main__ - Step 14378: {'lr': 0.0004914213772673319, 'samples': 2760576, 'steps': 14377, 'loss/train': 0.3423219919204712} +11/06/2021 23:13:56 - INFO - __main__ - Step 14379: {'lr': 0.0004914199989757529, 'samples': 2760768, 'steps': 14378, 'loss/train': 1.715069055557251} +11/06/2021 23:13:56 - INFO - __main__ - Step 14380: {'lr': 0.000491418620575394, 'samples': 2760960, 'steps': 14379, 'loss/train': 1.3890851736068726} +11/06/2021 23:13:57 - INFO - __main__ - Step 14381: {'lr': 0.0004914172420662556, 'samples': 2761152, 'steps': 14380, 'loss/train': 1.8425896167755127} +11/06/2021 23:13:57 - INFO - __main__ - Step 14382: {'lr': 0.0004914158634483381, 'samples': 2761344, 'steps': 14381, 'loss/train': 1.8168810606002808} +11/06/2021 23:13:57 - INFO - __main__ - Step 14383: {'lr': 0.0004914144847216425, 'samples': 2761536, 'steps': 14382, 'loss/train': 1.2000967264175415} +11/06/2021 23:13:58 - INFO - __main__ - Step 14384: {'lr': 0.0004914131058861693, 'samples': 2761728, 'steps': 14383, 'loss/train': 1.7531344890594482} +11/06/2021 23:13:59 - INFO - __main__ - Step 14385: {'lr': 0.000491411726941919, 'samples': 2761920, 'steps': 14384, 'loss/train': 1.7564046382904053} +11/06/2021 23:13:59 - INFO - __main__ - Step 14386: {'lr': 0.0004914103478888922, 'samples': 2762112, 'steps': 14385, 'loss/train': 1.1627519130706787} +11/06/2021 23:13:59 - INFO - __main__ - Step 14387: {'lr': 0.0004914089687270898, 'samples': 2762304, 'steps': 14386, 'loss/train': 1.7761569023132324} +11/06/2021 23:14:00 - INFO - __main__ - Step 14388: {'lr': 0.0004914075894565122, 'samples': 2762496, 'steps': 14387, 'loss/train': 1.060185194015503} +11/06/2021 23:14:00 - INFO - __main__ - Step 14389: {'lr': 0.00049140621007716, 'samples': 2762688, 'steps': 14388, 'loss/train': 1.5696700811386108} +11/06/2021 23:14:01 - INFO - __main__ - Step 14390: {'lr': 0.0004914048305890339, 'samples': 2762880, 'steps': 14389, 'loss/train': 1.3252995014190674} +11/06/2021 23:14:01 - INFO - __main__ - Step 14391: {'lr': 0.0004914034509921345, 'samples': 2763072, 'steps': 14390, 'loss/train': 2.1088061332702637} +11/06/2021 23:14:02 - INFO - __main__ - Step 14392: {'lr': 0.0004914020712864626, 'samples': 2763264, 'steps': 14391, 'loss/train': 1.9577943086624146} +11/06/2021 23:14:02 - INFO - __main__ - Step 14393: {'lr': 0.0004914006914720184, 'samples': 2763456, 'steps': 14392, 'loss/train': 1.1342967748641968} +11/06/2021 23:14:03 - INFO - __main__ - Step 14394: {'lr': 0.0004913993115488029, 'samples': 2763648, 'steps': 14393, 'loss/train': 1.1955634355545044} +11/06/2021 23:14:03 - INFO - __main__ - Step 14395: {'lr': 0.0004913979315168167, 'samples': 2763840, 'steps': 14394, 'loss/train': 1.5130412578582764} +11/06/2021 23:14:04 - INFO - __main__ - Step 14396: {'lr': 0.0004913965513760601, 'samples': 2764032, 'steps': 14395, 'loss/train': 1.6799837350845337} +11/06/2021 23:14:04 - INFO - __main__ - Step 14397: {'lr': 0.0004913951711265341, 'samples': 2764224, 'steps': 14396, 'loss/train': 1.8832666873931885} +11/06/2021 23:14:05 - INFO - __main__ - Step 14398: {'lr': 0.0004913937907682391, 'samples': 2764416, 'steps': 14397, 'loss/train': 1.6365022659301758} +11/06/2021 23:14:05 - INFO - __main__ - Step 14399: {'lr': 0.0004913924103011757, 'samples': 2764608, 'steps': 14398, 'loss/train': 1.8931413888931274} +11/06/2021 23:14:05 - INFO - __main__ - Step 14400: {'lr': 0.0004913910297253448, 'samples': 2764800, 'steps': 14399, 'loss/train': 1.8184783458709717} +11/06/2021 23:14:06 - INFO - __main__ - Step 14401: {'lr': 0.0004913896490407467, 'samples': 2764992, 'steps': 14400, 'loss/train': 1.6293751001358032} +11/06/2021 23:14:07 - INFO - __main__ - Step 14402: {'lr': 0.0004913882682473821, 'samples': 2765184, 'steps': 14401, 'loss/train': 1.6088601350784302} +11/06/2021 23:14:07 - INFO - __main__ - Step 14403: {'lr': 0.0004913868873452519, 'samples': 2765376, 'steps': 14402, 'loss/train': 1.4631474018096924} +11/06/2021 23:14:07 - INFO - __main__ - Step 14404: {'lr': 0.0004913855063343563, 'samples': 2765568, 'steps': 14403, 'loss/train': 1.457092523574829} +11/06/2021 23:14:08 - INFO - __main__ - Step 14405: {'lr': 0.0004913841252146961, 'samples': 2765760, 'steps': 14404, 'loss/train': 1.6985125541687012} +11/06/2021 23:14:09 - INFO - __main__ - Step 14406: {'lr': 0.000491382743986272, 'samples': 2765952, 'steps': 14405, 'loss/train': 2.084760904312134} +11/06/2021 23:14:09 - INFO - __main__ - Step 14407: {'lr': 0.0004913813626490845, 'samples': 2766144, 'steps': 14406, 'loss/train': 1.3225696086883545} +11/06/2021 23:14:09 - INFO - __main__ - Step 14408: {'lr': 0.0004913799812031343, 'samples': 2766336, 'steps': 14407, 'loss/train': 1.6497886180877686} +11/06/2021 23:14:10 - INFO - __main__ - Step 14409: {'lr': 0.0004913785996484221, 'samples': 2766528, 'steps': 14408, 'loss/train': 1.065016746520996} +11/06/2021 23:14:10 - INFO - __main__ - Step 14410: {'lr': 0.0004913772179849483, 'samples': 2766720, 'steps': 14409, 'loss/train': 1.7048285007476807} +11/06/2021 23:14:11 - INFO - __main__ - Step 14411: {'lr': 0.0004913758362127137, 'samples': 2766912, 'steps': 14410, 'loss/train': 1.4540810585021973} +11/06/2021 23:14:11 - INFO - __main__ - Step 14412: {'lr': 0.0004913744543317189, 'samples': 2767104, 'steps': 14411, 'loss/train': 1.4666005373001099} +11/06/2021 23:14:12 - INFO - __main__ - Step 14413: {'lr': 0.0004913730723419645, 'samples': 2767296, 'steps': 14412, 'loss/train': 1.2720320224761963} +11/06/2021 23:14:12 - INFO - __main__ - Step 14414: {'lr': 0.000491371690243451, 'samples': 2767488, 'steps': 14413, 'loss/train': 1.3805193901062012} +11/06/2021 23:14:12 - INFO - __main__ - Step 14415: {'lr': 0.0004913703080361793, 'samples': 2767680, 'steps': 14414, 'loss/train': 2.1130664348602295} +11/06/2021 23:14:14 - INFO - __main__ - Step 14416: {'lr': 0.0004913689257201499, 'samples': 2767872, 'steps': 14415, 'loss/train': 1.317294955253601} +11/06/2021 23:14:14 - INFO - __main__ - Step 14417: {'lr': 0.0004913675432953633, 'samples': 2768064, 'steps': 14416, 'loss/train': 1.1042780876159668} +11/06/2021 23:14:14 - INFO - __main__ - Step 14418: {'lr': 0.0004913661607618202, 'samples': 2768256, 'steps': 14417, 'loss/train': 2.0876216888427734} +11/06/2021 23:14:15 - INFO - __main__ - Step 14419: {'lr': 0.0004913647781195212, 'samples': 2768448, 'steps': 14418, 'loss/train': 1.5809930562973022} +11/06/2021 23:14:15 - INFO - __main__ - Step 14420: {'lr': 0.000491363395368467, 'samples': 2768640, 'steps': 14419, 'loss/train': 0.730297863483429} +11/06/2021 23:14:15 - INFO - __main__ - Step 14421: {'lr': 0.0004913620125086581, 'samples': 2768832, 'steps': 14420, 'loss/train': 5.8645501136779785} +11/06/2021 23:14:16 - INFO - __main__ - Step 14422: {'lr': 0.0004913606295400953, 'samples': 2769024, 'steps': 14421, 'loss/train': 2.153425455093384} +11/06/2021 23:14:17 - INFO - __main__ - Step 14423: {'lr': 0.000491359246462779, 'samples': 2769216, 'steps': 14422, 'loss/train': 1.7173231840133667} +11/06/2021 23:14:17 - INFO - __main__ - Step 14424: {'lr': 0.0004913578632767101, 'samples': 2769408, 'steps': 14423, 'loss/train': 1.7363717555999756} +11/06/2021 23:14:18 - INFO - __main__ - Step 14425: {'lr': 0.0004913564799818891, 'samples': 2769600, 'steps': 14424, 'loss/train': 1.796966314315796} +11/06/2021 23:14:18 - INFO - __main__ - Step 14426: {'lr': 0.0004913550965783165, 'samples': 2769792, 'steps': 14425, 'loss/train': 1.8378410339355469} +11/06/2021 23:14:19 - INFO - __main__ - Step 14427: {'lr': 0.000491353713065993, 'samples': 2769984, 'steps': 14426, 'loss/train': 1.9022510051727295} +11/06/2021 23:14:19 - INFO - __main__ - Step 14428: {'lr': 0.0004913523294449193, 'samples': 2770176, 'steps': 14427, 'loss/train': 1.5578607320785522} +11/06/2021 23:14:20 - INFO - __main__ - Step 14429: {'lr': 0.0004913509457150959, 'samples': 2770368, 'steps': 14428, 'loss/train': 1.9274928569793701} +11/06/2021 23:14:20 - INFO - __main__ - Step 14430: {'lr': 0.0004913495618765235, 'samples': 2770560, 'steps': 14429, 'loss/train': 1.6800792217254639} +11/06/2021 23:14:20 - INFO - __main__ - Step 14431: {'lr': 0.0004913481779292027, 'samples': 2770752, 'steps': 14430, 'loss/train': 1.7277616262435913} +11/06/2021 23:14:21 - INFO - __main__ - Step 14432: {'lr': 0.0004913467938731341, 'samples': 2770944, 'steps': 14431, 'loss/train': 1.655822992324829} +11/06/2021 23:14:22 - INFO - __main__ - Step 14433: {'lr': 0.0004913454097083185, 'samples': 2771136, 'steps': 14432, 'loss/train': 1.733009696006775} +11/06/2021 23:14:22 - INFO - __main__ - Step 14434: {'lr': 0.0004913440254347563, 'samples': 2771328, 'steps': 14433, 'loss/train': 2.231706380844116} +11/06/2021 23:14:23 - INFO - __main__ - Step 14435: {'lr': 0.0004913426410524482, 'samples': 2771520, 'steps': 14434, 'loss/train': 0.5304341316223145} +11/06/2021 23:14:23 - INFO - __main__ - Step 14436: {'lr': 0.0004913412565613948, 'samples': 2771712, 'steps': 14435, 'loss/train': 1.5568188428878784} +11/06/2021 23:14:23 - INFO - __main__ - Step 14437: {'lr': 0.0004913398719615968, 'samples': 2771904, 'steps': 14436, 'loss/train': 1.682983160018921} +11/06/2021 23:14:24 - INFO - __main__ - Step 14438: {'lr': 0.0004913384872530548, 'samples': 2772096, 'steps': 14437, 'loss/train': 1.6241941452026367} +11/06/2021 23:14:25 - INFO - __main__ - Step 14439: {'lr': 0.0004913371024357694, 'samples': 2772288, 'steps': 14438, 'loss/train': 1.7349668741226196} +11/06/2021 23:14:25 - INFO - __main__ - Step 14440: {'lr': 0.0004913357175097412, 'samples': 2772480, 'steps': 14439, 'loss/train': 2.172203302383423} +11/06/2021 23:14:25 - INFO - __main__ - Step 14441: {'lr': 0.0004913343324749708, 'samples': 2772672, 'steps': 14440, 'loss/train': 0.5017638206481934} +11/06/2021 23:14:26 - INFO - __main__ - Step 14442: {'lr': 0.000491332947331459, 'samples': 2772864, 'steps': 14441, 'loss/train': 1.8418453931808472} +11/06/2021 23:14:27 - INFO - __main__ - Step 14443: {'lr': 0.0004913315620792061, 'samples': 2773056, 'steps': 14442, 'loss/train': 1.784220576286316} +11/06/2021 23:14:27 - INFO - __main__ - Step 14444: {'lr': 0.0004913301767182131, 'samples': 2773248, 'steps': 14443, 'loss/train': 1.6641216278076172} +11/06/2021 23:14:27 - INFO - __main__ - Step 14445: {'lr': 0.0004913287912484804, 'samples': 2773440, 'steps': 14444, 'loss/train': 1.1389085054397583} +11/06/2021 23:14:28 - INFO - __main__ - Step 14446: {'lr': 0.0004913274056700087, 'samples': 2773632, 'steps': 14445, 'loss/train': 1.5397385358810425} +11/06/2021 23:14:28 - INFO - __main__ - Step 14447: {'lr': 0.0004913260199827986, 'samples': 2773824, 'steps': 14446, 'loss/train': 2.1198136806488037} +11/06/2021 23:14:29 - INFO - __main__ - Step 14448: {'lr': 0.0004913246341868506, 'samples': 2774016, 'steps': 14447, 'loss/train': 1.6462889909744263} +11/06/2021 23:14:30 - INFO - __main__ - Step 14449: {'lr': 0.0004913232482821656, 'samples': 2774208, 'steps': 14448, 'loss/train': 1.6559960842132568} +11/06/2021 23:14:30 - INFO - __main__ - Step 14450: {'lr': 0.0004913218622687439, 'samples': 2774400, 'steps': 14449, 'loss/train': 1.4591246843338013} +11/06/2021 23:14:30 - INFO - __main__ - Step 14451: {'lr': 0.0004913204761465864, 'samples': 2774592, 'steps': 14450, 'loss/train': 1.9061264991760254} +11/06/2021 23:14:31 - INFO - __main__ - Step 14452: {'lr': 0.0004913190899156936, 'samples': 2774784, 'steps': 14451, 'loss/train': 1.592616081237793} +11/06/2021 23:14:31 - INFO - __main__ - Step 14453: {'lr': 0.0004913177035760661, 'samples': 2774976, 'steps': 14452, 'loss/train': 1.2767666578292847} +11/06/2021 23:14:32 - INFO - __main__ - Step 14454: {'lr': 0.0004913163171277046, 'samples': 2775168, 'steps': 14453, 'loss/train': 1.2585607767105103} +11/06/2021 23:14:32 - INFO - __main__ - Step 14455: {'lr': 0.0004913149305706097, 'samples': 2775360, 'steps': 14454, 'loss/train': 1.6764591932296753} +11/06/2021 23:14:33 - INFO - __main__ - Step 14456: {'lr': 0.0004913135439047821, 'samples': 2775552, 'steps': 14455, 'loss/train': 1.7716397047042847} +11/06/2021 23:14:33 - INFO - __main__ - Step 14457: {'lr': 0.0004913121571302222, 'samples': 2775744, 'steps': 14456, 'loss/train': 1.690000057220459} +11/06/2021 23:14:33 - INFO - __main__ - Step 14458: {'lr': 0.0004913107702469308, 'samples': 2775936, 'steps': 14457, 'loss/train': 1.5991852283477783} +11/06/2021 23:14:34 - INFO - __main__ - Step 14459: {'lr': 0.0004913093832549085, 'samples': 2776128, 'steps': 14458, 'loss/train': 1.8135044574737549} +11/06/2021 23:14:35 - INFO - __main__ - Step 14460: {'lr': 0.000491307996154156, 'samples': 2776320, 'steps': 14459, 'loss/train': 1.87995445728302} +11/06/2021 23:14:35 - INFO - __main__ - Step 14461: {'lr': 0.0004913066089446737, 'samples': 2776512, 'steps': 14460, 'loss/train': 1.2176554203033447} +11/06/2021 23:14:35 - INFO - __main__ - Step 14462: {'lr': 0.0004913052216264624, 'samples': 2776704, 'steps': 14461, 'loss/train': 1.4758261442184448} +11/06/2021 23:14:36 - INFO - __main__ - Step 14463: {'lr': 0.0004913038341995227, 'samples': 2776896, 'steps': 14462, 'loss/train': 1.7246683835983276} +11/06/2021 23:14:37 - INFO - __main__ - Step 14464: {'lr': 0.0004913024466638553, 'samples': 2777088, 'steps': 14463, 'loss/train': 1.7339403629302979} +11/06/2021 23:14:37 - INFO - __main__ - Step 14465: {'lr': 0.0004913010590194607, 'samples': 2777280, 'steps': 14464, 'loss/train': 1.6634852886199951} +11/06/2021 23:14:37 - INFO - __main__ - Step 14466: {'lr': 0.0004912996712663396, 'samples': 2777472, 'steps': 14465, 'loss/train': 1.24350106716156} +11/06/2021 23:14:38 - INFO - __main__ - Step 14467: {'lr': 0.0004912982834044924, 'samples': 2777664, 'steps': 14466, 'loss/train': 1.8824312686920166} +11/06/2021 23:14:38 - INFO - __main__ - Step 14468: {'lr': 0.0004912968954339202, 'samples': 2777856, 'steps': 14467, 'loss/train': 1.555679202079773} +11/06/2021 23:14:39 - INFO - __main__ - Step 14469: {'lr': 0.0004912955073546231, 'samples': 2778048, 'steps': 14468, 'loss/train': 1.743302345275879} +11/06/2021 23:14:40 - INFO - __main__ - Step 14470: {'lr': 0.0004912941191666021, 'samples': 2778240, 'steps': 14469, 'loss/train': 1.9434269666671753} +11/06/2021 23:14:40 - INFO - __main__ - Step 14471: {'lr': 0.0004912927308698576, 'samples': 2778432, 'steps': 14470, 'loss/train': 1.7462414503097534} +11/06/2021 23:14:40 - INFO - __main__ - Step 14472: {'lr': 0.0004912913424643904, 'samples': 2778624, 'steps': 14471, 'loss/train': 1.8691980838775635} +11/06/2021 23:14:41 - INFO - __main__ - Step 14473: {'lr': 0.0004912899539502011, 'samples': 2778816, 'steps': 14472, 'loss/train': 1.504024624824524} +11/06/2021 23:14:42 - INFO - __main__ - Step 14474: {'lr': 0.0004912885653272902, 'samples': 2779008, 'steps': 14473, 'loss/train': 0.9449915289878845} +11/06/2021 23:14:42 - INFO - __main__ - Step 14475: {'lr': 0.0004912871765956583, 'samples': 2779200, 'steps': 14474, 'loss/train': 1.7823172807693481} +11/06/2021 23:14:43 - INFO - __main__ - Step 14476: {'lr': 0.0004912857877553062, 'samples': 2779392, 'steps': 14475, 'loss/train': 1.6257444620132446} +11/06/2021 23:14:43 - INFO - __main__ - Step 14477: {'lr': 0.0004912843988062345, 'samples': 2779584, 'steps': 14476, 'loss/train': 1.8921669721603394} +11/06/2021 23:14:43 - INFO - __main__ - Step 14478: {'lr': 0.0004912830097484437, 'samples': 2779776, 'steps': 14477, 'loss/train': 1.9633761644363403} +11/06/2021 23:14:44 - INFO - __main__ - Step 14479: {'lr': 0.0004912816205819346, 'samples': 2779968, 'steps': 14478, 'loss/train': 1.5476384162902832} +11/06/2021 23:14:45 - INFO - __main__ - Step 14480: {'lr': 0.0004912802313067076, 'samples': 2780160, 'steps': 14479, 'loss/train': 1.160788893699646} +11/06/2021 23:14:45 - INFO - __main__ - Step 14481: {'lr': 0.0004912788419227635, 'samples': 2780352, 'steps': 14480, 'loss/train': 1.3065866231918335} +11/06/2021 23:14:45 - INFO - __main__ - Step 14482: {'lr': 0.000491277452430103, 'samples': 2780544, 'steps': 14481, 'loss/train': 1.6148895025253296} +11/06/2021 23:14:46 - INFO - __main__ - Step 14483: {'lr': 0.0004912760628287264, 'samples': 2780736, 'steps': 14482, 'loss/train': 0.9406113028526306} +11/06/2021 23:14:46 - INFO - __main__ - Step 14484: {'lr': 0.0004912746731186346, 'samples': 2780928, 'steps': 14483, 'loss/train': 1.4715304374694824} +11/06/2021 23:14:48 - INFO - __main__ - Step 14485: {'lr': 0.0004912732832998281, 'samples': 2781120, 'steps': 14484, 'loss/train': 1.742849349975586} +11/06/2021 23:14:48 - INFO - __main__ - Step 14486: {'lr': 0.0004912718933723077, 'samples': 2781312, 'steps': 14485, 'loss/train': 1.7313225269317627} +11/06/2021 23:14:48 - INFO - __main__ - Step 14487: {'lr': 0.0004912705033360738, 'samples': 2781504, 'steps': 14486, 'loss/train': 1.3565199375152588} +11/06/2021 23:14:49 - INFO - __main__ - Step 14488: {'lr': 0.0004912691131911272, 'samples': 2781696, 'steps': 14487, 'loss/train': 1.073344111442566} +11/06/2021 23:14:49 - INFO - __main__ - Step 14489: {'lr': 0.0004912677229374684, 'samples': 2781888, 'steps': 14488, 'loss/train': 1.5861188173294067} +11/06/2021 23:14:50 - INFO - __main__ - Step 14490: {'lr': 0.0004912663325750982, 'samples': 2782080, 'steps': 14489, 'loss/train': 1.8165336847305298} +11/06/2021 23:14:50 - INFO - __main__ - Step 14491: {'lr': 0.000491264942104017, 'samples': 2782272, 'steps': 14490, 'loss/train': 0.944426953792572} +11/06/2021 23:14:51 - INFO - __main__ - Step 14492: {'lr': 0.0004912635515242257, 'samples': 2782464, 'steps': 14491, 'loss/train': 0.730577826499939} +11/06/2021 23:14:51 - INFO - __main__ - Step 14493: {'lr': 0.0004912621608357246, 'samples': 2782656, 'steps': 14492, 'loss/train': 2.3794353008270264} +11/06/2021 23:14:52 - INFO - __main__ - Step 14494: {'lr': 0.0004912607700385146, 'samples': 2782848, 'steps': 14493, 'loss/train': 1.526907205581665} +11/06/2021 23:14:52 - INFO - __main__ - Step 14495: {'lr': 0.0004912593791325962, 'samples': 2783040, 'steps': 14494, 'loss/train': 0.6017135977745056} +11/06/2021 23:14:52 - INFO - __main__ - Step 14496: {'lr': 0.00049125798811797, 'samples': 2783232, 'steps': 14495, 'loss/train': 1.5702513456344604} +11/06/2021 23:14:53 - INFO - __main__ - Step 14497: {'lr': 0.0004912565969946367, 'samples': 2783424, 'steps': 14496, 'loss/train': 1.7380554676055908} +11/06/2021 23:14:54 - INFO - __main__ - Step 14498: {'lr': 0.0004912552057625969, 'samples': 2783616, 'steps': 14497, 'loss/train': 1.791672706604004} +11/06/2021 23:14:54 - INFO - __main__ - Step 14499: {'lr': 0.0004912538144218512, 'samples': 2783808, 'steps': 14498, 'loss/train': 1.8101961612701416} +11/06/2021 23:14:54 - INFO - __main__ - Step 14500: {'lr': 0.0004912524229724002, 'samples': 2784000, 'steps': 14499, 'loss/train': 1.174378752708435} +11/06/2021 23:14:55 - INFO - __main__ - Step 14501: {'lr': 0.0004912510314142447, 'samples': 2784192, 'steps': 14500, 'loss/train': 1.9984477758407593} +11/06/2021 23:14:56 - INFO - __main__ - Step 14502: {'lr': 0.0004912496397473852, 'samples': 2784384, 'steps': 14501, 'loss/train': 2.0241353511810303} +11/06/2021 23:14:56 - INFO - __main__ - Step 14503: {'lr': 0.0004912482479718223, 'samples': 2784576, 'steps': 14502, 'loss/train': 1.441446304321289} +11/06/2021 23:14:56 - INFO - __main__ - Step 14504: {'lr': 0.0004912468560875566, 'samples': 2784768, 'steps': 14503, 'loss/train': 1.7977668046951294} +11/06/2021 23:14:57 - INFO - __main__ - Step 14505: {'lr': 0.0004912454640945889, 'samples': 2784960, 'steps': 14504, 'loss/train': 1.8055917024612427} +11/06/2021 23:14:57 - INFO - __main__ - Step 14506: {'lr': 0.0004912440719929196, 'samples': 2785152, 'steps': 14505, 'loss/train': 1.3446134328842163} +11/06/2021 23:14:58 - INFO - __main__ - Step 14507: {'lr': 0.0004912426797825495, 'samples': 2785344, 'steps': 14506, 'loss/train': 1.7469252347946167} +11/06/2021 23:14:59 - INFO - __main__ - Step 14508: {'lr': 0.0004912412874634792, 'samples': 2785536, 'steps': 14507, 'loss/train': 1.3988752365112305} +11/06/2021 23:14:59 - INFO - __main__ - Step 14509: {'lr': 0.0004912398950357094, 'samples': 2785728, 'steps': 14508, 'loss/train': 2.2110788822174072} +11/06/2021 23:14:59 - INFO - __main__ - Step 14510: {'lr': 0.0004912385024992404, 'samples': 2785920, 'steps': 14509, 'loss/train': 1.4885571002960205} +11/06/2021 23:15:00 - INFO - __main__ - Step 14511: {'lr': 0.0004912371098540733, 'samples': 2786112, 'steps': 14510, 'loss/train': 2.1764931678771973} +11/06/2021 23:15:01 - INFO - __main__ - Step 14512: {'lr': 0.0004912357171002082, 'samples': 2786304, 'steps': 14511, 'loss/train': 1.1966614723205566} +11/06/2021 23:15:01 - INFO - __main__ - Step 14513: {'lr': 0.0004912343242376462, 'samples': 2786496, 'steps': 14512, 'loss/train': 1.392907738685608} +11/06/2021 23:15:01 - INFO - __main__ - Step 14514: {'lr': 0.0004912329312663877, 'samples': 2786688, 'steps': 14513, 'loss/train': 1.479630947113037} +11/06/2021 23:15:02 - INFO - __main__ - Step 14515: {'lr': 0.0004912315381864333, 'samples': 2786880, 'steps': 14514, 'loss/train': 1.7795805931091309} +11/06/2021 23:15:02 - INFO - __main__ - Step 14516: {'lr': 0.0004912301449977837, 'samples': 2787072, 'steps': 14515, 'loss/train': 1.7214689254760742} +11/06/2021 23:15:02 - INFO - __main__ - Step 14517: {'lr': 0.0004912287517004397, 'samples': 2787264, 'steps': 14516, 'loss/train': 1.5596206188201904} +11/06/2021 23:15:03 - INFO - __main__ - Step 14518: {'lr': 0.0004912273582944015, 'samples': 2787456, 'steps': 14517, 'loss/train': 1.3602560758590698} +11/06/2021 23:15:04 - INFO - __main__ - Step 14519: {'lr': 0.0004912259647796701, 'samples': 2787648, 'steps': 14518, 'loss/train': 1.7231316566467285} +11/06/2021 23:15:04 - INFO - __main__ - Step 14520: {'lr': 0.000491224571156246, 'samples': 2787840, 'steps': 14519, 'loss/train': 1.2232226133346558} +11/06/2021 23:15:05 - INFO - __main__ - Step 14521: {'lr': 0.0004912231774241298, 'samples': 2788032, 'steps': 14520, 'loss/train': 1.797451138496399} +11/06/2021 23:15:05 - INFO - __main__ - Step 14522: {'lr': 0.0004912217835833222, 'samples': 2788224, 'steps': 14521, 'loss/train': 0.9428983926773071} +11/06/2021 23:15:06 - INFO - __main__ - Step 14523: {'lr': 0.0004912203896338238, 'samples': 2788416, 'steps': 14522, 'loss/train': 1.4348275661468506} +11/06/2021 23:15:06 - INFO - __main__ - Step 14524: {'lr': 0.0004912189955756351, 'samples': 2788608, 'steps': 14523, 'loss/train': 1.5228583812713623} +11/06/2021 23:15:07 - INFO - __main__ - Step 14525: {'lr': 0.000491217601408757, 'samples': 2788800, 'steps': 14524, 'loss/train': 1.8126468658447266} +11/06/2021 23:15:07 - INFO - __main__ - Step 14526: {'lr': 0.0004912162071331898, 'samples': 2788992, 'steps': 14525, 'loss/train': 1.6764172315597534} +11/06/2021 23:15:07 - INFO - __main__ - Step 14527: {'lr': 0.0004912148127489345, 'samples': 2789184, 'steps': 14526, 'loss/train': 1.4271752834320068} +11/06/2021 23:15:08 - INFO - __main__ - Step 14528: {'lr': 0.0004912134182559913, 'samples': 2789376, 'steps': 14527, 'loss/train': 1.7659759521484375} +11/06/2021 23:15:09 - INFO - __main__ - Step 14529: {'lr': 0.0004912120236543611, 'samples': 2789568, 'steps': 14528, 'loss/train': 1.7609317302703857} +11/06/2021 23:15:09 - INFO - __main__ - Step 14530: {'lr': 0.0004912106289440446, 'samples': 2789760, 'steps': 14529, 'loss/train': 1.904273271560669} +11/06/2021 23:15:09 - INFO - __main__ - Step 14531: {'lr': 0.0004912092341250422, 'samples': 2789952, 'steps': 14530, 'loss/train': 1.7561595439910889} +11/06/2021 23:15:10 - INFO - __main__ - Step 14532: {'lr': 0.0004912078391973547, 'samples': 2790144, 'steps': 14531, 'loss/train': 1.3714295625686646} +11/06/2021 23:15:11 - INFO - __main__ - Step 14533: {'lr': 0.0004912064441609827, 'samples': 2790336, 'steps': 14532, 'loss/train': 1.4325453042984009} +11/06/2021 23:15:11 - INFO - __main__ - Step 14534: {'lr': 0.0004912050490159268, 'samples': 2790528, 'steps': 14533, 'loss/train': 1.7847373485565186} +11/06/2021 23:15:11 - INFO - __main__ - Step 14535: {'lr': 0.0004912036537621877, 'samples': 2790720, 'steps': 14534, 'loss/train': 2.0088417530059814} +11/06/2021 23:15:12 - INFO - __main__ - Step 14536: {'lr': 0.0004912022583997658, 'samples': 2790912, 'steps': 14535, 'loss/train': 1.3345286846160889} +11/06/2021 23:15:12 - INFO - __main__ - Step 14537: {'lr': 0.0004912008629286619, 'samples': 2791104, 'steps': 14536, 'loss/train': 1.6118730306625366} +11/06/2021 23:15:12 - INFO - __main__ - Step 14538: {'lr': 0.0004911994673488766, 'samples': 2791296, 'steps': 14537, 'loss/train': 1.377058982849121} +11/06/2021 23:15:14 - INFO - __main__ - Step 14539: {'lr': 0.0004911980716604107, 'samples': 2791488, 'steps': 14538, 'loss/train': 1.6407101154327393} +11/06/2021 23:15:14 - INFO - __main__ - Step 14540: {'lr': 0.0004911966758632645, 'samples': 2791680, 'steps': 14539, 'loss/train': 1.8519309759140015} +11/06/2021 23:15:14 - INFO - __main__ - Step 14541: {'lr': 0.000491195279957439, 'samples': 2791872, 'steps': 14540, 'loss/train': 1.6462745666503906} +11/06/2021 23:15:15 - INFO - __main__ - Step 14542: {'lr': 0.0004911938839429344, 'samples': 2792064, 'steps': 14541, 'loss/train': 1.8177210092544556} +11/06/2021 23:15:15 - INFO - __main__ - Step 14543: {'lr': 0.0004911924878197517, 'samples': 2792256, 'steps': 14542, 'loss/train': 2.063103437423706} +11/06/2021 23:15:16 - INFO - __main__ - Step 14544: {'lr': 0.0004911910915878913, 'samples': 2792448, 'steps': 14543, 'loss/train': 2.019076347351074} +11/06/2021 23:15:16 - INFO - __main__ - Step 14545: {'lr': 0.000491189695247354, 'samples': 2792640, 'steps': 14544, 'loss/train': 1.723437786102295} +11/06/2021 23:15:17 - INFO - __main__ - Step 14546: {'lr': 0.0004911882987981404, 'samples': 2792832, 'steps': 14545, 'loss/train': 1.8162659406661987} +11/06/2021 23:15:17 - INFO - __main__ - Step 14547: {'lr': 0.0004911869022402508, 'samples': 2793024, 'steps': 14546, 'loss/train': 1.8774888515472412} +11/06/2021 23:15:17 - INFO - __main__ - Step 14548: {'lr': 0.0004911855055736863, 'samples': 2793216, 'steps': 14547, 'loss/train': 1.6280256509780884} +11/06/2021 23:15:18 - INFO - __main__ - Step 14549: {'lr': 0.0004911841087984473, 'samples': 2793408, 'steps': 14548, 'loss/train': 1.9488242864608765} +11/06/2021 23:15:19 - INFO - __main__ - Step 14550: {'lr': 0.0004911827119145345, 'samples': 2793600, 'steps': 14549, 'loss/train': 2.1403818130493164} +11/06/2021 23:15:19 - INFO - __main__ - Step 14551: {'lr': 0.0004911813149219485, 'samples': 2793792, 'steps': 14550, 'loss/train': 1.7999236583709717} +11/06/2021 23:15:19 - INFO - __main__ - Step 14552: {'lr': 0.0004911799178206899, 'samples': 2793984, 'steps': 14551, 'loss/train': 1.94169020652771} +11/06/2021 23:15:20 - INFO - __main__ - Step 14553: {'lr': 0.0004911785206107592, 'samples': 2794176, 'steps': 14552, 'loss/train': 1.5757359266281128} +11/06/2021 23:15:21 - INFO - __main__ - Step 14554: {'lr': 0.0004911771232921575, 'samples': 2794368, 'steps': 14553, 'loss/train': 1.7550246715545654} +11/06/2021 23:15:21 - INFO - __main__ - Step 14555: {'lr': 0.0004911757258648849, 'samples': 2794560, 'steps': 14554, 'loss/train': 1.0412113666534424} +11/06/2021 23:15:22 - INFO - __main__ - Step 14556: {'lr': 0.0004911743283289423, 'samples': 2794752, 'steps': 14555, 'loss/train': 1.524915337562561} +11/06/2021 23:15:22 - INFO - __main__ - Step 14557: {'lr': 0.0004911729306843302, 'samples': 2794944, 'steps': 14556, 'loss/train': 1.9681403636932373} +11/06/2021 23:15:23 - INFO - __main__ - Step 14558: {'lr': 0.0004911715329310493, 'samples': 2795136, 'steps': 14557, 'loss/train': 1.4831455945968628} +11/06/2021 23:15:23 - INFO - __main__ - Step 14559: {'lr': 0.0004911701350691002, 'samples': 2795328, 'steps': 14558, 'loss/train': 0.9031453132629395} +11/06/2021 23:15:24 - INFO - __main__ - Step 14560: {'lr': 0.0004911687370984836, 'samples': 2795520, 'steps': 14559, 'loss/train': 1.7917287349700928} +11/06/2021 23:15:24 - INFO - __main__ - Step 14561: {'lr': 0.0004911673390192002, 'samples': 2795712, 'steps': 14560, 'loss/train': 1.3398245573043823} +11/06/2021 23:15:25 - INFO - __main__ - Step 14562: {'lr': 0.0004911659408312505, 'samples': 2795904, 'steps': 14561, 'loss/train': 1.7333766222000122} +11/06/2021 23:15:25 - INFO - __main__ - Step 14563: {'lr': 0.000491164542534635, 'samples': 2796096, 'steps': 14562, 'loss/train': 1.9331468343734741} +11/06/2021 23:15:25 - INFO - __main__ - Step 14564: {'lr': 0.0004911631441293546, 'samples': 2796288, 'steps': 14563, 'loss/train': 1.3357164859771729} +11/06/2021 23:15:26 - INFO - __main__ - Step 14565: {'lr': 0.0004911617456154097, 'samples': 2796480, 'steps': 14564, 'loss/train': 1.6416891813278198} +11/06/2021 23:15:27 - INFO - __main__ - Step 14566: {'lr': 0.0004911603469928012, 'samples': 2796672, 'steps': 14565, 'loss/train': 2.241854667663574} +11/06/2021 23:15:27 - INFO - __main__ - Step 14567: {'lr': 0.0004911589482615294, 'samples': 2796864, 'steps': 14566, 'loss/train': 0.8703035116195679} +11/06/2021 23:15:27 - INFO - __main__ - Step 14568: {'lr': 0.0004911575494215952, 'samples': 2797056, 'steps': 14567, 'loss/train': 1.3895127773284912} +11/06/2021 23:15:28 - INFO - __main__ - Step 14569: {'lr': 0.0004911561504729992, 'samples': 2797248, 'steps': 14568, 'loss/train': 3.218695878982544} +11/06/2021 23:15:28 - INFO - __main__ - Step 14570: {'lr': 0.0004911547514157417, 'samples': 2797440, 'steps': 14569, 'loss/train': 1.9162862300872803} +11/06/2021 23:15:29 - INFO - __main__ - Step 14571: {'lr': 0.0004911533522498239, 'samples': 2797632, 'steps': 14570, 'loss/train': 1.7870599031448364} +11/06/2021 23:15:29 - INFO - __main__ - Step 14572: {'lr': 0.0004911519529752459, 'samples': 2797824, 'steps': 14571, 'loss/train': 2.2179548740386963} +11/06/2021 23:15:30 - INFO - __main__ - Step 14573: {'lr': 0.0004911505535920086, 'samples': 2798016, 'steps': 14572, 'loss/train': 1.6157692670822144} +11/06/2021 23:15:30 - INFO - __main__ - Step 14574: {'lr': 0.0004911491541001126, 'samples': 2798208, 'steps': 14573, 'loss/train': 1.6204320192337036} +11/06/2021 23:15:30 - INFO - __main__ - Step 14575: {'lr': 0.0004911477544995585, 'samples': 2798400, 'steps': 14574, 'loss/train': 1.705611228942871} +11/06/2021 23:15:31 - INFO - __main__ - Step 14576: {'lr': 0.000491146354790347, 'samples': 2798592, 'steps': 14575, 'loss/train': 1.5545910596847534} +11/06/2021 23:15:32 - INFO - __main__ - Step 14577: {'lr': 0.0004911449549724786, 'samples': 2798784, 'steps': 14576, 'loss/train': 1.5566593408584595} +11/06/2021 23:15:32 - INFO - __main__ - Step 14578: {'lr': 0.0004911435550459541, 'samples': 2798976, 'steps': 14577, 'loss/train': 2.1471126079559326} +11/06/2021 23:15:32 - INFO - __main__ - Step 14579: {'lr': 0.0004911421550107739, 'samples': 2799168, 'steps': 14578, 'loss/train': 1.5826555490493774} +11/06/2021 23:15:33 - INFO - __main__ - Step 14580: {'lr': 0.0004911407548669389, 'samples': 2799360, 'steps': 14579, 'loss/train': 1.8544542789459229} +11/06/2021 23:15:34 - INFO - __main__ - Step 14581: {'lr': 0.0004911393546144495, 'samples': 2799552, 'steps': 14580, 'loss/train': 1.4082012176513672} +11/06/2021 23:15:34 - INFO - __main__ - Step 14582: {'lr': 0.0004911379542533065, 'samples': 2799744, 'steps': 14581, 'loss/train': 1.3058255910873413} +11/06/2021 23:15:35 - INFO - __main__ - Step 14583: {'lr': 0.0004911365537835105, 'samples': 2799936, 'steps': 14582, 'loss/train': 0.7232246398925781} +11/06/2021 23:15:35 - INFO - __main__ - Step 14584: {'lr': 0.000491135153205062, 'samples': 2800128, 'steps': 14583, 'loss/train': 1.6225132942199707} +11/06/2021 23:15:35 - INFO - __main__ - Step 14585: {'lr': 0.0004911337525179616, 'samples': 2800320, 'steps': 14584, 'loss/train': 1.6813801527023315} +11/06/2021 23:15:36 - INFO - __main__ - Step 14586: {'lr': 0.0004911323517222103, 'samples': 2800512, 'steps': 14585, 'loss/train': 1.8164918422698975} +11/06/2021 23:15:37 - INFO - __main__ - Step 14587: {'lr': 0.0004911309508178084, 'samples': 2800704, 'steps': 14586, 'loss/train': 1.225614309310913} +11/06/2021 23:15:37 - INFO - __main__ - Step 14588: {'lr': 0.0004911295498047565, 'samples': 2800896, 'steps': 14587, 'loss/train': 2.0302164554595947} +11/06/2021 23:15:37 - INFO - __main__ - Step 14589: {'lr': 0.0004911281486830554, 'samples': 2801088, 'steps': 14588, 'loss/train': 1.7795565128326416} +11/06/2021 23:15:38 - INFO - __main__ - Step 14590: {'lr': 0.0004911267474527058, 'samples': 2801280, 'steps': 14589, 'loss/train': 1.4832676649093628} +11/06/2021 23:15:39 - INFO - __main__ - Step 14591: {'lr': 0.000491125346113708, 'samples': 2801472, 'steps': 14590, 'loss/train': 1.647063136100769} +11/06/2021 23:15:39 - INFO - __main__ - Step 14592: {'lr': 0.000491123944666063, 'samples': 2801664, 'steps': 14591, 'loss/train': 1.9390480518341064} +11/06/2021 23:15:39 - INFO - __main__ - Step 14593: {'lr': 0.0004911225431097712, 'samples': 2801856, 'steps': 14592, 'loss/train': 1.7286971807479858} +11/06/2021 23:15:40 - INFO - __main__ - Step 14594: {'lr': 0.0004911211414448333, 'samples': 2802048, 'steps': 14593, 'loss/train': 1.6285250186920166} +11/06/2021 23:15:40 - INFO - __main__ - Step 14595: {'lr': 0.0004911197396712501, 'samples': 2802240, 'steps': 14594, 'loss/train': 1.946718692779541} +11/06/2021 23:15:41 - INFO - __main__ - Step 14596: {'lr': 0.0004911183377890218, 'samples': 2802432, 'steps': 14595, 'loss/train': 1.3001048564910889} +11/06/2021 23:15:42 - INFO - __main__ - Step 14597: {'lr': 0.0004911169357981496, 'samples': 2802624, 'steps': 14596, 'loss/train': 1.6624016761779785} +11/06/2021 23:15:42 - INFO - __main__ - Step 14598: {'lr': 0.0004911155336986335, 'samples': 2802816, 'steps': 14597, 'loss/train': 2.089146614074707} +11/06/2021 23:15:42 - INFO - __main__ - Step 14599: {'lr': 0.0004911141314904747, 'samples': 2803008, 'steps': 14598, 'loss/train': 1.3329648971557617} +11/06/2021 23:15:43 - INFO - __main__ - Step 14600: {'lr': 0.0004911127291736735, 'samples': 2803200, 'steps': 14599, 'loss/train': 1.4260157346725464} +11/06/2021 23:15:43 - INFO - __main__ - Step 14601: {'lr': 0.0004911113267482307, 'samples': 2803392, 'steps': 14600, 'loss/train': 1.7082431316375732} +11/06/2021 23:15:44 - INFO - __main__ - Step 14602: {'lr': 0.0004911099242141467, 'samples': 2803584, 'steps': 14601, 'loss/train': 1.4876233339309692} +11/06/2021 23:15:44 - INFO - __main__ - Step 14603: {'lr': 0.0004911085215714224, 'samples': 2803776, 'steps': 14602, 'loss/train': 1.9533902406692505} +11/06/2021 23:15:45 - INFO - __main__ - Step 14604: {'lr': 0.0004911071188200584, 'samples': 2803968, 'steps': 14603, 'loss/train': 2.090561866760254} +11/06/2021 23:15:45 - INFO - __main__ - Step 14605: {'lr': 0.0004911057159600551, 'samples': 2804160, 'steps': 14604, 'loss/train': 1.5187530517578125} +11/06/2021 23:15:45 - INFO - __main__ - Step 14606: {'lr': 0.0004911043129914133, 'samples': 2804352, 'steps': 14605, 'loss/train': 0.9737354516983032} +11/06/2021 23:15:46 - INFO - __main__ - Step 14607: {'lr': 0.0004911029099141336, 'samples': 2804544, 'steps': 14606, 'loss/train': 1.8305327892303467} +11/06/2021 23:15:47 - INFO - __main__ - Step 14608: {'lr': 0.0004911015067282168, 'samples': 2804736, 'steps': 14607, 'loss/train': 1.8033746480941772} +11/06/2021 23:15:47 - INFO - __main__ - Step 14609: {'lr': 0.0004911001034336633, 'samples': 2804928, 'steps': 14608, 'loss/train': 1.6968247890472412} +11/06/2021 23:15:47 - INFO - __main__ - Step 14610: {'lr': 0.0004910987000304737, 'samples': 2805120, 'steps': 14609, 'loss/train': 1.5940757989883423} +11/06/2021 23:15:48 - INFO - __main__ - Step 14611: {'lr': 0.0004910972965186488, 'samples': 2805312, 'steps': 14610, 'loss/train': 1.7843865156173706} +11/06/2021 23:15:48 - INFO - __main__ - Step 14612: {'lr': 0.0004910958928981893, 'samples': 2805504, 'steps': 14611, 'loss/train': 1.8916642665863037} +11/06/2021 23:15:49 - INFO - __main__ - Step 14613: {'lr': 0.0004910944891690956, 'samples': 2805696, 'steps': 14612, 'loss/train': 1.5665946006774902} +11/06/2021 23:15:49 - INFO - __main__ - Step 14614: {'lr': 0.0004910930853313686, 'samples': 2805888, 'steps': 14613, 'loss/train': 1.1098638772964478} +11/06/2021 23:15:50 - INFO - __main__ - Step 14615: {'lr': 0.0004910916813850086, 'samples': 2806080, 'steps': 14614, 'loss/train': 1.3663274049758911} +11/06/2021 23:15:50 - INFO - __main__ - Step 14616: {'lr': 0.0004910902773300164, 'samples': 2806272, 'steps': 14615, 'loss/train': 1.2368197441101074} +11/06/2021 23:15:51 - INFO - __main__ - Step 14617: {'lr': 0.0004910888731663928, 'samples': 2806464, 'steps': 14616, 'loss/train': 1.519328236579895} +11/06/2021 23:15:52 - INFO - __main__ - Step 14618: {'lr': 0.0004910874688941381, 'samples': 2806656, 'steps': 14617, 'loss/train': 1.4356929063796997} +11/06/2021 23:15:52 - INFO - __main__ - Step 14619: {'lr': 0.0004910860645132532, 'samples': 2806848, 'steps': 14618, 'loss/train': 1.3084660768508911} +11/06/2021 23:15:52 - INFO - __main__ - Step 14620: {'lr': 0.0004910846600237386, 'samples': 2807040, 'steps': 14619, 'loss/train': 1.374779224395752} +11/06/2021 23:15:53 - INFO - __main__ - Step 14621: {'lr': 0.0004910832554255951, 'samples': 2807232, 'steps': 14620, 'loss/train': 1.7540532350540161} +11/06/2021 23:15:53 - INFO - __main__ - Step 14622: {'lr': 0.0004910818507188231, 'samples': 2807424, 'steps': 14621, 'loss/train': 1.5536149740219116} +11/06/2021 23:15:54 - INFO - __main__ - Step 14623: {'lr': 0.0004910804459034233, 'samples': 2807616, 'steps': 14622, 'loss/train': 1.8700112104415894} +11/06/2021 23:15:55 - INFO - __main__ - Step 14624: {'lr': 0.0004910790409793965, 'samples': 2807808, 'steps': 14623, 'loss/train': 1.8716275691986084} +11/06/2021 23:15:55 - INFO - __main__ - Step 14625: {'lr': 0.000491077635946743, 'samples': 2808000, 'steps': 14624, 'loss/train': 1.835631012916565} +11/06/2021 23:15:55 - INFO - __main__ - Step 14626: {'lr': 0.0004910762308054638, 'samples': 2808192, 'steps': 14625, 'loss/train': 1.5419883728027344} +11/06/2021 23:15:56 - INFO - __main__ - Step 14627: {'lr': 0.0004910748255555593, 'samples': 2808384, 'steps': 14626, 'loss/train': 0.7711548805236816} +11/06/2021 23:15:56 - INFO - __main__ - Step 14628: {'lr': 0.0004910734201970302, 'samples': 2808576, 'steps': 14627, 'loss/train': 1.3061710596084595} +11/06/2021 23:15:57 - INFO - __main__ - Step 14629: {'lr': 0.0004910720147298772, 'samples': 2808768, 'steps': 14628, 'loss/train': 1.5132771730422974} +11/06/2021 23:15:58 - INFO - __main__ - Step 14630: {'lr': 0.0004910706091541009, 'samples': 2808960, 'steps': 14629, 'loss/train': 1.1088963747024536} +11/06/2021 23:15:58 - INFO - __main__ - Step 14631: {'lr': 0.0004910692034697018, 'samples': 2809152, 'steps': 14630, 'loss/train': 1.5924564599990845} +11/06/2021 23:15:58 - INFO - __main__ - Step 14632: {'lr': 0.0004910677976766807, 'samples': 2809344, 'steps': 14631, 'loss/train': 1.2352012395858765} +11/06/2021 23:15:59 - INFO - __main__ - Step 14633: {'lr': 0.0004910663917750382, 'samples': 2809536, 'steps': 14632, 'loss/train': 1.8392850160598755} +11/06/2021 23:15:59 - INFO - __main__ - Step 14634: {'lr': 0.0004910649857647748, 'samples': 2809728, 'steps': 14633, 'loss/train': 1.6638622283935547} +11/06/2021 23:16:00 - INFO - __main__ - Step 14635: {'lr': 0.0004910635796458913, 'samples': 2809920, 'steps': 14634, 'loss/train': 2.037661075592041} +11/06/2021 23:16:00 - INFO - __main__ - Step 14636: {'lr': 0.0004910621734183882, 'samples': 2810112, 'steps': 14635, 'loss/train': 0.8195475935935974} +11/06/2021 23:16:01 - INFO - __main__ - Step 14637: {'lr': 0.0004910607670822663, 'samples': 2810304, 'steps': 14636, 'loss/train': 1.5160691738128662} +11/06/2021 23:16:01 - INFO - __main__ - Step 14638: {'lr': 0.0004910593606375261, 'samples': 2810496, 'steps': 14637, 'loss/train': 2.147937297821045} +11/06/2021 23:16:02 - INFO - __main__ - Step 14639: {'lr': 0.0004910579540841683, 'samples': 2810688, 'steps': 14638, 'loss/train': 0.8111184239387512} +11/06/2021 23:16:03 - INFO - __main__ - Step 14640: {'lr': 0.0004910565474221934, 'samples': 2810880, 'steps': 14639, 'loss/train': 1.6241923570632935} +11/06/2021 23:16:03 - INFO - __main__ - Step 14641: {'lr': 0.0004910551406516022, 'samples': 2811072, 'steps': 14640, 'loss/train': 2.166555404663086} +11/06/2021 23:16:03 - INFO - __main__ - Step 14642: {'lr': 0.0004910537337723954, 'samples': 2811264, 'steps': 14641, 'loss/train': 1.8136534690856934} +11/06/2021 23:16:04 - INFO - __main__ - Step 14643: {'lr': 0.0004910523267845733, 'samples': 2811456, 'steps': 14642, 'loss/train': 1.5173137187957764} +11/06/2021 23:16:04 - INFO - __main__ - Step 14644: {'lr': 0.0004910509196881369, 'samples': 2811648, 'steps': 14643, 'loss/train': 1.1134371757507324} +11/06/2021 23:16:05 - INFO - __main__ - Step 14645: {'lr': 0.0004910495124830866, 'samples': 2811840, 'steps': 14644, 'loss/train': 1.4934502840042114} +11/06/2021 23:16:05 - INFO - __main__ - Step 14646: {'lr': 0.0004910481051694231, 'samples': 2812032, 'steps': 14645, 'loss/train': 1.9416497945785522} +11/06/2021 23:16:06 - INFO - __main__ - Step 14647: {'lr': 0.0004910466977471471, 'samples': 2812224, 'steps': 14646, 'loss/train': 1.6827425956726074} +11/06/2021 23:16:06 - INFO - __main__ - Step 14648: {'lr': 0.0004910452902162592, 'samples': 2812416, 'steps': 14647, 'loss/train': 1.602482795715332} +11/06/2021 23:16:06 - INFO - __main__ - Step 14649: {'lr': 0.0004910438825767599, 'samples': 2812608, 'steps': 14648, 'loss/train': 1.5670403242111206} +11/06/2021 23:16:08 - INFO - __main__ - Step 14650: {'lr': 0.00049104247482865, 'samples': 2812800, 'steps': 14649, 'loss/train': 1.4646493196487427} +11/06/2021 23:16:08 - INFO - __main__ - Step 14651: {'lr': 0.0004910410669719301, 'samples': 2812992, 'steps': 14650, 'loss/train': 1.5942716598510742} +11/06/2021 23:16:08 - INFO - __main__ - Step 14652: {'lr': 0.0004910396590066008, 'samples': 2813184, 'steps': 14651, 'loss/train': 1.6040905714035034} +11/06/2021 23:16:09 - INFO - __main__ - Step 14653: {'lr': 0.0004910382509326627, 'samples': 2813376, 'steps': 14652, 'loss/train': 2.0839693546295166} +11/06/2021 23:16:09 - INFO - __main__ - Step 14654: {'lr': 0.0004910368427501166, 'samples': 2813568, 'steps': 14653, 'loss/train': 1.966593861579895} +11/06/2021 23:16:10 - INFO - __main__ - Step 14655: {'lr': 0.000491035434458963, 'samples': 2813760, 'steps': 14654, 'loss/train': 2.07354998588562} +11/06/2021 23:16:10 - INFO - __main__ - Step 14656: {'lr': 0.0004910340260592024, 'samples': 2813952, 'steps': 14655, 'loss/train': 1.6633130311965942} +11/06/2021 23:16:11 - INFO - __main__ - Step 14657: {'lr': 0.0004910326175508357, 'samples': 2814144, 'steps': 14656, 'loss/train': 2.252934694290161} +11/06/2021 23:16:11 - INFO - __main__ - Step 14658: {'lr': 0.0004910312089338634, 'samples': 2814336, 'steps': 14657, 'loss/train': 1.369263768196106} +11/06/2021 23:16:11 - INFO - __main__ - Step 14659: {'lr': 0.0004910298002082863, 'samples': 2814528, 'steps': 14658, 'loss/train': 1.274910807609558} +11/06/2021 23:16:12 - INFO - __main__ - Step 14660: {'lr': 0.0004910283913741047, 'samples': 2814720, 'steps': 14659, 'loss/train': 1.555715560913086} +11/06/2021 23:16:13 - INFO - __main__ - Step 14661: {'lr': 0.0004910269824313194, 'samples': 2814912, 'steps': 14660, 'loss/train': 1.4081352949142456} +11/06/2021 23:16:13 - INFO - __main__ - Step 14662: {'lr': 0.0004910255733799312, 'samples': 2815104, 'steps': 14661, 'loss/train': 1.7849104404449463} +11/06/2021 23:16:13 - INFO - __main__ - Step 14663: {'lr': 0.0004910241642199406, 'samples': 2815296, 'steps': 14662, 'loss/train': 1.4840021133422852} +11/06/2021 23:16:14 - INFO - __main__ - Step 14664: {'lr': 0.0004910227549513481, 'samples': 2815488, 'steps': 14663, 'loss/train': 1.7678169012069702} +11/06/2021 23:16:14 - INFO - __main__ - Step 14665: {'lr': 0.0004910213455741546, 'samples': 2815680, 'steps': 14664, 'loss/train': 1.6775918006896973} +11/06/2021 23:16:15 - INFO - __main__ - Step 14666: {'lr': 0.0004910199360883605, 'samples': 2815872, 'steps': 14665, 'loss/train': 1.950029969215393} +11/06/2021 23:16:16 - INFO - __main__ - Step 14667: {'lr': 0.0004910185264939667, 'samples': 2816064, 'steps': 14666, 'loss/train': 1.7304264307022095} +11/06/2021 23:16:16 - INFO - __main__ - Step 14668: {'lr': 0.0004910171167909734, 'samples': 2816256, 'steps': 14667, 'loss/train': 1.4172935485839844} +11/06/2021 23:16:16 - INFO - __main__ - Step 14669: {'lr': 0.0004910157069793816, 'samples': 2816448, 'steps': 14668, 'loss/train': 1.8779479265213013} +11/06/2021 23:16:17 - INFO - __main__ - Step 14670: {'lr': 0.000491014297059192, 'samples': 2816640, 'steps': 14669, 'loss/train': 1.943215012550354} +11/06/2021 23:16:18 - INFO - __main__ - Step 14671: {'lr': 0.000491012887030405, 'samples': 2816832, 'steps': 14670, 'loss/train': 1.6946277618408203} +11/06/2021 23:16:18 - INFO - __main__ - Step 14672: {'lr': 0.0004910114768930212, 'samples': 2817024, 'steps': 14671, 'loss/train': 1.4919730424880981} +11/06/2021 23:16:18 - INFO - __main__ - Step 14673: {'lr': 0.0004910100666470415, 'samples': 2817216, 'steps': 14672, 'loss/train': 1.942678689956665} +11/06/2021 23:16:19 - INFO - __main__ - Step 14674: {'lr': 0.0004910086562924663, 'samples': 2817408, 'steps': 14673, 'loss/train': 1.5062963962554932} +11/06/2021 23:16:19 - INFO - __main__ - Step 14675: {'lr': 0.0004910072458292963, 'samples': 2817600, 'steps': 14674, 'loss/train': 1.1559689044952393} +11/06/2021 23:16:20 - INFO - __main__ - Step 14676: {'lr': 0.0004910058352575322, 'samples': 2817792, 'steps': 14675, 'loss/train': 1.5200366973876953} +11/06/2021 23:16:20 - INFO - __main__ - Step 14677: {'lr': 0.0004910044245771745, 'samples': 2817984, 'steps': 14676, 'loss/train': 1.2778904438018799} +11/06/2021 23:16:21 - INFO - __main__ - Step 14678: {'lr': 0.0004910030137882241, 'samples': 2818176, 'steps': 14677, 'loss/train': 2.667948007583618} +11/06/2021 23:16:21 - INFO - __main__ - Step 14679: {'lr': 0.0004910016028906813, 'samples': 2818368, 'steps': 14678, 'loss/train': 2.185955047607422} +11/06/2021 23:16:22 - INFO - __main__ - Step 14680: {'lr': 0.000491000191884547, 'samples': 2818560, 'steps': 14679, 'loss/train': 1.723203420639038} +11/06/2021 23:16:23 - INFO - __main__ - Step 14681: {'lr': 0.0004909987807698217, 'samples': 2818752, 'steps': 14680, 'loss/train': 1.139530062675476} +11/06/2021 23:16:23 - INFO - __main__ - Step 14682: {'lr': 0.000490997369546506, 'samples': 2818944, 'steps': 14681, 'loss/train': 1.7487425804138184} +11/06/2021 23:16:23 - INFO - __main__ - Step 14683: {'lr': 0.0004909959582146007, 'samples': 2819136, 'steps': 14682, 'loss/train': 1.6787686347961426} +11/06/2021 23:16:24 - INFO - __main__ - Step 14684: {'lr': 0.0004909945467741063, 'samples': 2819328, 'steps': 14683, 'loss/train': 1.1271356344223022} +11/06/2021 23:16:24 - INFO - __main__ - Step 14685: {'lr': 0.0004909931352250235, 'samples': 2819520, 'steps': 14684, 'loss/train': 3.540257453918457} +11/06/2021 23:16:24 - INFO - __main__ - Step 14686: {'lr': 0.0004909917235673529, 'samples': 2819712, 'steps': 14685, 'loss/train': 1.8830620050430298} +11/06/2021 23:16:25 - INFO - __main__ - Step 14687: {'lr': 0.0004909903118010951, 'samples': 2819904, 'steps': 14686, 'loss/train': 1.717665433883667} +11/06/2021 23:16:26 - INFO - __main__ - Step 14688: {'lr': 0.0004909888999262509, 'samples': 2820096, 'steps': 14687, 'loss/train': 0.35629066824913025} +11/06/2021 23:16:26 - INFO - __main__ - Step 14689: {'lr': 0.0004909874879428207, 'samples': 2820288, 'steps': 14688, 'loss/train': 1.5923266410827637} +11/06/2021 23:16:26 - INFO - __main__ - Step 14690: {'lr': 0.0004909860758508052, 'samples': 2820480, 'steps': 14689, 'loss/train': 1.798073172569275} +11/06/2021 23:16:27 - INFO - __main__ - Step 14691: {'lr': 0.0004909846636502053, 'samples': 2820672, 'steps': 14690, 'loss/train': 1.2456002235412598} +11/06/2021 23:16:28 - INFO - __main__ - Step 14692: {'lr': 0.0004909832513410213, 'samples': 2820864, 'steps': 14691, 'loss/train': 1.8775510787963867} +11/06/2021 23:16:28 - INFO - __main__ - Step 14693: {'lr': 0.000490981838923254, 'samples': 2821056, 'steps': 14692, 'loss/train': 2.1554715633392334} +11/06/2021 23:16:29 - INFO - __main__ - Step 14694: {'lr': 0.000490980426396904, 'samples': 2821248, 'steps': 14693, 'loss/train': 1.8785821199417114} +11/06/2021 23:16:29 - INFO - __main__ - Step 14695: {'lr': 0.0004909790137619719, 'samples': 2821440, 'steps': 14694, 'loss/train': 1.473230242729187} +11/06/2021 23:16:29 - INFO - __main__ - Step 14696: {'lr': 0.0004909776010184585, 'samples': 2821632, 'steps': 14695, 'loss/train': 1.770862340927124} +11/06/2021 23:16:30 - INFO - __main__ - Step 14697: {'lr': 0.0004909761881663642, 'samples': 2821824, 'steps': 14696, 'loss/train': 1.7851510047912598} +11/06/2021 23:16:31 - INFO - __main__ - Step 14698: {'lr': 0.0004909747752056897, 'samples': 2822016, 'steps': 14697, 'loss/train': 1.8535454273223877} +11/06/2021 23:16:31 - INFO - __main__ - Step 14699: {'lr': 0.0004909733621364358, 'samples': 2822208, 'steps': 14698, 'loss/train': 1.4395469427108765} +11/06/2021 23:16:31 - INFO - __main__ - Step 14700: {'lr': 0.0004909719489586029, 'samples': 2822400, 'steps': 14699, 'loss/train': 1.9752013683319092} +11/06/2021 23:16:32 - INFO - __main__ - Step 14701: {'lr': 0.0004909705356721919, 'samples': 2822592, 'steps': 14700, 'loss/train': 1.4780222177505493} +11/06/2021 23:16:32 - INFO - __main__ - Step 14702: {'lr': 0.0004909691222772032, 'samples': 2822784, 'steps': 14701, 'loss/train': 1.6931217908859253} +11/06/2021 23:16:33 - INFO - __main__ - Step 14703: {'lr': 0.0004909677087736375, 'samples': 2822976, 'steps': 14702, 'loss/train': 1.33567214012146} +11/06/2021 23:16:33 - INFO - __main__ - Step 14704: {'lr': 0.0004909662951614955, 'samples': 2823168, 'steps': 14703, 'loss/train': 1.3383984565734863} +11/06/2021 23:16:34 - INFO - __main__ - Step 14705: {'lr': 0.0004909648814407779, 'samples': 2823360, 'steps': 14704, 'loss/train': 1.8960798978805542} +11/06/2021 23:16:34 - INFO - __main__ - Step 14706: {'lr': 0.0004909634676114851, 'samples': 2823552, 'steps': 14705, 'loss/train': 1.757364273071289} +11/06/2021 23:16:34 - INFO - __main__ - Step 14707: {'lr': 0.000490962053673618, 'samples': 2823744, 'steps': 14706, 'loss/train': 1.1211416721343994} +11/06/2021 23:16:36 - INFO - __main__ - Step 14708: {'lr': 0.0004909606396271771, 'samples': 2823936, 'steps': 14707, 'loss/train': 1.9302036762237549} +11/06/2021 23:16:36 - INFO - __main__ - Step 14709: {'lr': 0.000490959225472163, 'samples': 2824128, 'steps': 14708, 'loss/train': 1.3645907640457153} +11/06/2021 23:16:36 - INFO - __main__ - Step 14710: {'lr': 0.0004909578112085764, 'samples': 2824320, 'steps': 14709, 'loss/train': 1.793792724609375} +11/06/2021 23:16:37 - INFO - __main__ - Step 14711: {'lr': 0.0004909563968364179, 'samples': 2824512, 'steps': 14710, 'loss/train': 1.516960859298706} +11/06/2021 23:16:37 - INFO - __main__ - Step 14712: {'lr': 0.0004909549823556883, 'samples': 2824704, 'steps': 14711, 'loss/train': 1.5521596670150757} +11/06/2021 23:16:37 - INFO - __main__ - Step 14713: {'lr': 0.000490953567766388, 'samples': 2824896, 'steps': 14712, 'loss/train': 1.9512124061584473} +11/06/2021 23:16:38 - INFO - __main__ - Step 14714: {'lr': 0.0004909521530685177, 'samples': 2825088, 'steps': 14713, 'loss/train': 2.1272761821746826} +11/06/2021 23:16:39 - INFO - __main__ - Step 14715: {'lr': 0.0004909507382620782, 'samples': 2825280, 'steps': 14714, 'loss/train': 1.705784559249878} +11/06/2021 23:16:39 - INFO - __main__ - Step 14716: {'lr': 0.0004909493233470699, 'samples': 2825472, 'steps': 14715, 'loss/train': 1.458823323249817} +11/06/2021 23:16:40 - INFO - __main__ - Step 14717: {'lr': 0.0004909479083234936, 'samples': 2825664, 'steps': 14716, 'loss/train': 1.4705344438552856} +11/06/2021 23:16:40 - INFO - __main__ - Step 14718: {'lr': 0.0004909464931913499, 'samples': 2825856, 'steps': 14717, 'loss/train': 2.149104118347168} +11/06/2021 23:16:41 - INFO - __main__ - Step 14719: {'lr': 0.0004909450779506393, 'samples': 2826048, 'steps': 14718, 'loss/train': 1.4514827728271484} +11/06/2021 23:16:41 - INFO - __main__ - Step 14720: {'lr': 0.0004909436626013628, 'samples': 2826240, 'steps': 14719, 'loss/train': 1.459384799003601} +11/06/2021 23:16:42 - INFO - __main__ - Step 14721: {'lr': 0.0004909422471435207, 'samples': 2826432, 'steps': 14720, 'loss/train': 1.9327574968338013} +11/06/2021 23:16:42 - INFO - __main__ - Step 14722: {'lr': 0.0004909408315771136, 'samples': 2826624, 'steps': 14721, 'loss/train': 1.8887290954589844} +11/06/2021 23:16:42 - INFO - __main__ - Step 14723: {'lr': 0.0004909394159021425, 'samples': 2826816, 'steps': 14722, 'loss/train': 1.6616466045379639} +11/06/2021 23:16:43 - INFO - __main__ - Step 14724: {'lr': 0.0004909380001186077, 'samples': 2827008, 'steps': 14723, 'loss/train': 1.528913974761963} +11/06/2021 23:16:44 - INFO - __main__ - Step 14725: {'lr': 0.00049093658422651, 'samples': 2827200, 'steps': 14724, 'loss/train': 1.4247432947158813} +11/06/2021 23:16:44 - INFO - __main__ - Step 14726: {'lr': 0.00049093516822585, 'samples': 2827392, 'steps': 14725, 'loss/train': 2.329897165298462} +11/06/2021 23:16:44 - INFO - __main__ - Step 14727: {'lr': 0.0004909337521166282, 'samples': 2827584, 'steps': 14726, 'loss/train': 1.4586058855056763} +11/06/2021 23:16:45 - INFO - __main__ - Step 14728: {'lr': 0.0004909323358988455, 'samples': 2827776, 'steps': 14727, 'loss/train': 1.297971487045288} +11/06/2021 23:16:45 - INFO - __main__ - Step 14729: {'lr': 0.0004909309195725024, 'samples': 2827968, 'steps': 14728, 'loss/train': 1.9658069610595703} +11/06/2021 23:16:46 - INFO - __main__ - Step 14730: {'lr': 0.0004909295031375996, 'samples': 2828160, 'steps': 14729, 'loss/train': 1.5267490148544312} +11/06/2021 23:16:47 - INFO - __main__ - Step 14731: {'lr': 0.0004909280865941375, 'samples': 2828352, 'steps': 14730, 'loss/train': 1.8899013996124268} +11/06/2021 23:16:47 - INFO - __main__ - Step 14732: {'lr': 0.0004909266699421171, 'samples': 2828544, 'steps': 14731, 'loss/train': 1.7061964273452759} +11/06/2021 23:16:47 - INFO - __main__ - Step 14733: {'lr': 0.0004909252531815388, 'samples': 2828736, 'steps': 14732, 'loss/train': 1.6438379287719727} +11/06/2021 23:16:48 - INFO - __main__ - Step 14734: {'lr': 0.0004909238363124033, 'samples': 2828928, 'steps': 14733, 'loss/train': 1.719048023223877} +11/06/2021 23:16:49 - INFO - __main__ - Step 14735: {'lr': 0.0004909224193347112, 'samples': 2829120, 'steps': 14734, 'loss/train': 1.9832409620285034} +11/06/2021 23:16:49 - INFO - __main__ - Step 14736: {'lr': 0.0004909210022484633, 'samples': 2829312, 'steps': 14735, 'loss/train': 2.6759371757507324} +11/06/2021 23:16:49 - INFO - __main__ - Step 14737: {'lr': 0.00049091958505366, 'samples': 2829504, 'steps': 14736, 'loss/train': 1.7943952083587646} +11/06/2021 23:16:50 - INFO - __main__ - Step 14738: {'lr': 0.000490918167750302, 'samples': 2829696, 'steps': 14737, 'loss/train': 1.9066545963287354} +11/06/2021 23:16:50 - INFO - __main__ - Step 14739: {'lr': 0.00049091675033839, 'samples': 2829888, 'steps': 14738, 'loss/train': 1.0074669122695923} +11/06/2021 23:16:51 - INFO - __main__ - Step 14740: {'lr': 0.0004909153328179248, 'samples': 2830080, 'steps': 14739, 'loss/train': 1.9582070112228394} +11/06/2021 23:16:51 - INFO - __main__ - Step 14741: {'lr': 0.0004909139151889067, 'samples': 2830272, 'steps': 14740, 'loss/train': 2.478091239929199} +11/06/2021 23:16:52 - INFO - __main__ - Step 14742: {'lr': 0.0004909124974513366, 'samples': 2830464, 'steps': 14741, 'loss/train': 1.6102755069732666} +11/06/2021 23:16:52 - INFO - __main__ - Step 14743: {'lr': 0.000490911079605215, 'samples': 2830656, 'steps': 14742, 'loss/train': 1.9308674335479736} +11/06/2021 23:16:53 - INFO - __main__ - Step 14744: {'lr': 0.0004909096616505426, 'samples': 2830848, 'steps': 14743, 'loss/train': 1.605130672454834} +11/06/2021 23:16:53 - INFO - __main__ - Step 14745: {'lr': 0.00049090824358732, 'samples': 2831040, 'steps': 14744, 'loss/train': 1.5920521020889282} +11/06/2021 23:16:54 - INFO - __main__ - Step 14746: {'lr': 0.0004909068254155479, 'samples': 2831232, 'steps': 14745, 'loss/train': 1.7607147693634033} +11/06/2021 23:16:55 - INFO - __main__ - Step 14747: {'lr': 0.0004909054071352269, 'samples': 2831424, 'steps': 14746, 'loss/train': 1.231070876121521} +11/06/2021 23:16:55 - INFO - __main__ - Step 14748: {'lr': 0.0004909039887463576, 'samples': 2831616, 'steps': 14747, 'loss/train': 1.5784339904785156} +11/06/2021 23:16:55 - INFO - __main__ - Step 14749: {'lr': 0.0004909025702489407, 'samples': 2831808, 'steps': 14748, 'loss/train': 0.686924934387207} +11/06/2021 23:16:56 - INFO - __main__ - Step 14750: {'lr': 0.0004909011516429768, 'samples': 2832000, 'steps': 14749, 'loss/train': 1.3042925596237183} +11/06/2021 23:16:57 - INFO - __main__ - Step 14751: {'lr': 0.0004908997329284667, 'samples': 2832192, 'steps': 14750, 'loss/train': 1.7104178667068481} +11/06/2021 23:16:57 - INFO - __main__ - Step 14752: {'lr': 0.0004908983141054107, 'samples': 2832384, 'steps': 14751, 'loss/train': 1.4332627058029175} +11/06/2021 23:16:57 - INFO - __main__ - Step 14753: {'lr': 0.0004908968951738098, 'samples': 2832576, 'steps': 14752, 'loss/train': 2.133230209350586} +11/06/2021 23:16:58 - INFO - __main__ - Step 14754: {'lr': 0.0004908954761336643, 'samples': 2832768, 'steps': 14753, 'loss/train': 1.732865333557129} +11/06/2021 23:16:58 - INFO - __main__ - Step 14755: {'lr': 0.0004908940569849751, 'samples': 2832960, 'steps': 14754, 'loss/train': 1.9178493022918701} +11/06/2021 23:16:59 - INFO - __main__ - Step 14756: {'lr': 0.0004908926377277428, 'samples': 2833152, 'steps': 14755, 'loss/train': 1.5390150547027588} +11/06/2021 23:16:59 - INFO - __main__ - Step 14757: {'lr': 0.000490891218361968, 'samples': 2833344, 'steps': 14756, 'loss/train': 1.8167674541473389} +11/06/2021 23:17:00 - INFO - __main__ - Step 14758: {'lr': 0.0004908897988876512, 'samples': 2833536, 'steps': 14757, 'loss/train': 1.5798640251159668} +11/06/2021 23:17:00 - INFO - __main__ - Step 14759: {'lr': 0.0004908883793047934, 'samples': 2833728, 'steps': 14758, 'loss/train': 1.2919437885284424} +11/06/2021 23:17:01 - INFO - __main__ - Step 14760: {'lr': 0.0004908869596133948, 'samples': 2833920, 'steps': 14759, 'loss/train': 2.303706407546997} +11/06/2021 23:17:01 - INFO - __main__ - Step 14761: {'lr': 0.0004908855398134563, 'samples': 2834112, 'steps': 14760, 'loss/train': 1.3456342220306396} +11/06/2021 23:17:02 - INFO - __main__ - Step 14762: {'lr': 0.0004908841199049785, 'samples': 2834304, 'steps': 14761, 'loss/train': 1.4965943098068237} +11/06/2021 23:17:02 - INFO - __main__ - Step 14763: {'lr': 0.0004908826998879621, 'samples': 2834496, 'steps': 14762, 'loss/train': 1.7584352493286133} +11/06/2021 23:17:03 - INFO - __main__ - Step 14764: {'lr': 0.0004908812797624077, 'samples': 2834688, 'steps': 14763, 'loss/train': 1.936519980430603} +11/06/2021 23:17:03 - INFO - __main__ - Step 14765: {'lr': 0.0004908798595283159, 'samples': 2834880, 'steps': 14764, 'loss/train': 2.077310562133789} +11/06/2021 23:17:03 - INFO - __main__ - Step 14766: {'lr': 0.0004908784391856872, 'samples': 2835072, 'steps': 14765, 'loss/train': 1.6648650169372559} +11/06/2021 23:17:05 - INFO - __main__ - Step 14767: {'lr': 0.0004908770187345225, 'samples': 2835264, 'steps': 14766, 'loss/train': 1.7535183429718018} +11/06/2021 23:17:05 - INFO - __main__ - Step 14768: {'lr': 0.0004908755981748223, 'samples': 2835456, 'steps': 14767, 'loss/train': 1.9513096809387207} +11/06/2021 23:17:05 - INFO - __main__ - Step 14769: {'lr': 0.0004908741775065873, 'samples': 2835648, 'steps': 14768, 'loss/train': 2.233029365539551} +11/06/2021 23:17:06 - INFO - __main__ - Step 14770: {'lr': 0.0004908727567298181, 'samples': 2835840, 'steps': 14769, 'loss/train': 1.4736902713775635} +11/06/2021 23:17:06 - INFO - __main__ - Step 14771: {'lr': 0.0004908713358445154, 'samples': 2836032, 'steps': 14770, 'loss/train': 5.864256381988525} +11/06/2021 23:17:06 - INFO - __main__ - Step 14772: {'lr': 0.0004908699148506797, 'samples': 2836224, 'steps': 14771, 'loss/train': 1.9193412065505981} +11/06/2021 23:17:07 - INFO - __main__ - Step 14773: {'lr': 0.0004908684937483119, 'samples': 2836416, 'steps': 14772, 'loss/train': 1.799191951751709} +11/06/2021 23:17:08 - INFO - __main__ - Step 14774: {'lr': 0.0004908670725374122, 'samples': 2836608, 'steps': 14773, 'loss/train': 1.3834148645401} +11/06/2021 23:17:08 - INFO - __main__ - Step 14775: {'lr': 0.0004908656512179817, 'samples': 2836800, 'steps': 14774, 'loss/train': 1.5654276609420776} +11/06/2021 23:17:08 - INFO - __main__ - Step 14776: {'lr': 0.0004908642297900209, 'samples': 2836992, 'steps': 14775, 'loss/train': 1.6006273031234741} +11/06/2021 23:17:09 - INFO - __main__ - Step 14777: {'lr': 0.0004908628082535303, 'samples': 2837184, 'steps': 14776, 'loss/train': 1.8874455690383911} +11/06/2021 23:17:10 - INFO - __main__ - Step 14778: {'lr': 0.0004908613866085106, 'samples': 2837376, 'steps': 14777, 'loss/train': 1.3304411172866821} +11/06/2021 23:17:10 - INFO - __main__ - Step 14779: {'lr': 0.0004908599648549626, 'samples': 2837568, 'steps': 14778, 'loss/train': 1.500115990638733} +11/06/2021 23:17:11 - INFO - __main__ - Step 14780: {'lr': 0.0004908585429928867, 'samples': 2837760, 'steps': 14779, 'loss/train': 1.748668909072876} +11/06/2021 23:17:11 - INFO - __main__ - Step 14781: {'lr': 0.0004908571210222837, 'samples': 2837952, 'steps': 14780, 'loss/train': 1.470587968826294} +11/06/2021 23:17:11 - INFO - __main__ - Step 14782: {'lr': 0.0004908556989431543, 'samples': 2838144, 'steps': 14781, 'loss/train': 0.8396479487419128} +11/06/2021 23:17:12 - INFO - __main__ - Step 14783: {'lr': 0.0004908542767554988, 'samples': 2838336, 'steps': 14782, 'loss/train': 1.8558242321014404} +11/06/2021 23:17:13 - INFO - __main__ - Step 14784: {'lr': 0.0004908528544593184, 'samples': 2838528, 'steps': 14783, 'loss/train': 1.9126049280166626} +11/06/2021 23:17:13 - INFO - __main__ - Step 14785: {'lr': 0.0004908514320546132, 'samples': 2838720, 'steps': 14784, 'loss/train': 1.7966852188110352} +11/06/2021 23:17:13 - INFO - __main__ - Step 14786: {'lr': 0.000490850009541384, 'samples': 2838912, 'steps': 14785, 'loss/train': 1.829959750175476} +11/06/2021 23:17:14 - INFO - __main__ - Step 14787: {'lr': 0.0004908485869196317, 'samples': 2839104, 'steps': 14786, 'loss/train': 1.6409757137298584} +11/06/2021 23:17:15 - INFO - __main__ - Step 14788: {'lr': 0.0004908471641893566, 'samples': 2839296, 'steps': 14787, 'loss/train': 1.4668761491775513} +11/06/2021 23:17:15 - INFO - __main__ - Step 14789: {'lr': 0.0004908457413505596, 'samples': 2839488, 'steps': 14788, 'loss/train': 1.7249447107315063} +11/06/2021 23:17:16 - INFO - __main__ - Step 14790: {'lr': 0.0004908443184032411, 'samples': 2839680, 'steps': 14789, 'loss/train': 1.671472430229187} +11/06/2021 23:17:16 - INFO - __main__ - Step 14791: {'lr': 0.0004908428953474019, 'samples': 2839872, 'steps': 14790, 'loss/train': 1.2302889823913574} +11/06/2021 23:17:16 - INFO - __main__ - Step 14792: {'lr': 0.0004908414721830427, 'samples': 2840064, 'steps': 14791, 'loss/train': 1.5707032680511475} +11/06/2021 23:17:17 - INFO - __main__ - Step 14793: {'lr': 0.000490840048910164, 'samples': 2840256, 'steps': 14792, 'loss/train': 1.8218657970428467} +11/06/2021 23:17:18 - INFO - __main__ - Step 14794: {'lr': 0.0004908386255287664, 'samples': 2840448, 'steps': 14793, 'loss/train': 2.0798017978668213} +11/06/2021 23:17:18 - INFO - __main__ - Step 14795: {'lr': 0.0004908372020388508, 'samples': 2840640, 'steps': 14794, 'loss/train': 1.7213116884231567} +11/06/2021 23:17:18 - INFO - __main__ - Step 14796: {'lr': 0.0004908357784404175, 'samples': 2840832, 'steps': 14795, 'loss/train': 1.5220595598220825} +11/06/2021 23:17:19 - INFO - __main__ - Step 14797: {'lr': 0.0004908343547334674, 'samples': 2841024, 'steps': 14796, 'loss/train': 1.586082100868225} +11/06/2021 23:17:19 - INFO - __main__ - Step 14798: {'lr': 0.0004908329309180011, 'samples': 2841216, 'steps': 14797, 'loss/train': 2.087536573410034} +11/06/2021 23:17:20 - INFO - __main__ - Step 14799: {'lr': 0.0004908315069940191, 'samples': 2841408, 'steps': 14798, 'loss/train': 1.841811180114746} +11/06/2021 23:17:20 - INFO - __main__ - Step 14800: {'lr': 0.0004908300829615222, 'samples': 2841600, 'steps': 14799, 'loss/train': 1.4489543437957764} +11/06/2021 23:17:21 - INFO - __main__ - Step 14801: {'lr': 0.000490828658820511, 'samples': 2841792, 'steps': 14800, 'loss/train': 1.7258611917495728} +11/06/2021 23:17:21 - INFO - __main__ - Step 14802: {'lr': 0.0004908272345709861, 'samples': 2841984, 'steps': 14801, 'loss/train': 1.824029564857483} +11/06/2021 23:17:21 - INFO - __main__ - Step 14803: {'lr': 0.0004908258102129481, 'samples': 2842176, 'steps': 14802, 'loss/train': 1.134230375289917} +11/06/2021 23:17:23 - INFO - __main__ - Step 14804: {'lr': 0.0004908243857463978, 'samples': 2842368, 'steps': 14803, 'loss/train': 1.6424596309661865} +11/06/2021 23:17:23 - INFO - __main__ - Step 14805: {'lr': 0.0004908229611713357, 'samples': 2842560, 'steps': 14804, 'loss/train': 1.7975839376449585} +11/06/2021 23:17:23 - INFO - __main__ - Step 14806: {'lr': 0.0004908215364877625, 'samples': 2842752, 'steps': 14805, 'loss/train': 1.8489753007888794} +11/06/2021 23:17:24 - INFO - __main__ - Step 14807: {'lr': 0.0004908201116956788, 'samples': 2842944, 'steps': 14806, 'loss/train': 4.51678466796875} +11/06/2021 23:17:24 - INFO - __main__ - Step 14808: {'lr': 0.0004908186867950854, 'samples': 2843136, 'steps': 14807, 'loss/train': 1.53168785572052} +11/06/2021 23:17:24 - INFO - __main__ - Step 14809: {'lr': 0.0004908172617859826, 'samples': 2843328, 'steps': 14808, 'loss/train': 1.772919774055481} +11/06/2021 23:17:25 - INFO - __main__ - Step 14810: {'lr': 0.0004908158366683714, 'samples': 2843520, 'steps': 14809, 'loss/train': 2.220637798309326} +11/06/2021 23:17:26 - INFO - __main__ - Step 14811: {'lr': 0.0004908144114422523, 'samples': 2843712, 'steps': 14810, 'loss/train': 0.5302165150642395} +11/06/2021 23:17:26 - INFO - __main__ - Step 14812: {'lr': 0.000490812986107626, 'samples': 2843904, 'steps': 14811, 'loss/train': 1.51813542842865} +11/06/2021 23:17:26 - INFO - __main__ - Step 14813: {'lr': 0.000490811560664493, 'samples': 2844096, 'steps': 14812, 'loss/train': 1.3996822834014893} +11/06/2021 23:17:27 - INFO - __main__ - Step 14814: {'lr': 0.000490810135112854, 'samples': 2844288, 'steps': 14813, 'loss/train': 1.816659688949585} +11/06/2021 23:17:28 - INFO - __main__ - Step 14815: {'lr': 0.0004908087094527097, 'samples': 2844480, 'steps': 14814, 'loss/train': 1.3649659156799316} +11/06/2021 23:17:28 - INFO - __main__ - Step 14816: {'lr': 0.0004908072836840607, 'samples': 2844672, 'steps': 14815, 'loss/train': 1.6869769096374512} +11/06/2021 23:17:29 - INFO - __main__ - Step 14817: {'lr': 0.0004908058578069077, 'samples': 2844864, 'steps': 14816, 'loss/train': 1.6598951816558838} +11/06/2021 23:17:29 - INFO - __main__ - Step 14818: {'lr': 0.0004908044318212512, 'samples': 2845056, 'steps': 14817, 'loss/train': 1.5969890356063843} +11/06/2021 23:17:29 - INFO - __main__ - Step 14819: {'lr': 0.000490803005727092, 'samples': 2845248, 'steps': 14818, 'loss/train': 1.8578797578811646} +11/06/2021 23:17:30 - INFO - __main__ - Step 14820: {'lr': 0.0004908015795244307, 'samples': 2845440, 'steps': 14819, 'loss/train': 1.8108375072479248} +11/06/2021 23:17:31 - INFO - __main__ - Step 14821: {'lr': 0.0004908001532132679, 'samples': 2845632, 'steps': 14820, 'loss/train': 1.6355654001235962} +11/06/2021 23:17:31 - INFO - __main__ - Step 14822: {'lr': 0.0004907987267936042, 'samples': 2845824, 'steps': 14821, 'loss/train': 1.8750498294830322} +11/06/2021 23:17:31 - INFO - __main__ - Step 14823: {'lr': 0.0004907973002654404, 'samples': 2846016, 'steps': 14822, 'loss/train': 1.708099603652954} +11/06/2021 23:17:32 - INFO - __main__ - Step 14824: {'lr': 0.0004907958736287771, 'samples': 2846208, 'steps': 14823, 'loss/train': 1.5635958909988403} +11/06/2021 23:17:33 - INFO - __main__ - Step 14825: {'lr': 0.0004907944468836148, 'samples': 2846400, 'steps': 14824, 'loss/train': 3.393544912338257} +11/06/2021 23:17:33 - INFO - __main__ - Step 14826: {'lr': 0.0004907930200299543, 'samples': 2846592, 'steps': 14825, 'loss/train': 1.548439383506775} +11/06/2021 23:17:33 - INFO - __main__ - Step 14827: {'lr': 0.0004907915930677961, 'samples': 2846784, 'steps': 14826, 'loss/train': 1.3716732263565063} +11/06/2021 23:17:34 - INFO - __main__ - Step 14828: {'lr': 0.000490790165997141, 'samples': 2846976, 'steps': 14827, 'loss/train': 1.7341458797454834} +11/06/2021 23:17:34 - INFO - __main__ - Step 14829: {'lr': 0.0004907887388179896, 'samples': 2847168, 'steps': 14828, 'loss/train': 1.6612669229507446} +11/06/2021 23:17:35 - INFO - __main__ - Step 14830: {'lr': 0.0004907873115303424, 'samples': 2847360, 'steps': 14829, 'loss/train': 1.5637840032577515} +11/06/2021 23:17:36 - INFO - __main__ - Step 14831: {'lr': 0.0004907858841342002, 'samples': 2847552, 'steps': 14830, 'loss/train': 1.3963515758514404} +11/06/2021 23:17:36 - INFO - __main__ - Step 14832: {'lr': 0.0004907844566295637, 'samples': 2847744, 'steps': 14831, 'loss/train': 1.5587491989135742} +11/06/2021 23:17:36 - INFO - __main__ - Step 14833: {'lr': 0.0004907830290164332, 'samples': 2847936, 'steps': 14832, 'loss/train': 1.662847638130188} +11/06/2021 23:17:37 - INFO - __main__ - Step 14834: {'lr': 0.0004907816012948098, 'samples': 2848128, 'steps': 14833, 'loss/train': 2.050675630569458} +11/06/2021 23:17:37 - INFO - __main__ - Step 14835: {'lr': 0.0004907801734646938, 'samples': 2848320, 'steps': 14834, 'loss/train': 1.9373985528945923} +11/06/2021 23:17:38 - INFO - __main__ - Step 14836: {'lr': 0.000490778745526086, 'samples': 2848512, 'steps': 14835, 'loss/train': 1.7804934978485107} +11/06/2021 23:17:38 - INFO - __main__ - Step 14837: {'lr': 0.000490777317478987, 'samples': 2848704, 'steps': 14836, 'loss/train': 1.345388412475586} +11/06/2021 23:17:39 - INFO - __main__ - Step 14838: {'lr': 0.0004907758893233975, 'samples': 2848896, 'steps': 14837, 'loss/train': 1.093638300895691} +11/06/2021 23:17:39 - INFO - __main__ - Step 14839: {'lr': 0.0004907744610593181, 'samples': 2849088, 'steps': 14838, 'loss/train': 1.936640739440918} +11/06/2021 23:17:39 - INFO - __main__ - Step 14840: {'lr': 0.0004907730326867495, 'samples': 2849280, 'steps': 14839, 'loss/train': 1.6983401775360107} +11/06/2021 23:17:40 - INFO - __main__ - Step 14841: {'lr': 0.0004907716042056921, 'samples': 2849472, 'steps': 14840, 'loss/train': 2.199077844619751} +11/06/2021 23:17:41 - INFO - __main__ - Step 14842: {'lr': 0.0004907701756161469, 'samples': 2849664, 'steps': 14841, 'loss/train': 2.0116066932678223} +11/06/2021 23:17:41 - INFO - __main__ - Step 14843: {'lr': 0.0004907687469181143, 'samples': 2849856, 'steps': 14842, 'loss/train': 1.461774230003357} +11/06/2021 23:17:41 - INFO - __main__ - Step 14844: {'lr': 0.000490767318111595, 'samples': 2850048, 'steps': 14843, 'loss/train': 1.6642917394638062} +11/06/2021 23:17:42 - INFO - __main__ - Step 14845: {'lr': 0.0004907658891965897, 'samples': 2850240, 'steps': 14844, 'loss/train': 1.9356948137283325} +11/06/2021 23:17:43 - INFO - __main__ - Step 14846: {'lr': 0.000490764460173099, 'samples': 2850432, 'steps': 14845, 'loss/train': 1.7684423923492432} +11/06/2021 23:17:43 - INFO - __main__ - Step 14847: {'lr': 0.0004907630310411236, 'samples': 2850624, 'steps': 14846, 'loss/train': 1.5917563438415527} +11/06/2021 23:17:43 - INFO - __main__ - Step 14848: {'lr': 0.000490761601800664, 'samples': 2850816, 'steps': 14847, 'loss/train': 1.7513176202774048} +11/06/2021 23:17:44 - INFO - __main__ - Step 14849: {'lr': 0.000490760172451721, 'samples': 2851008, 'steps': 14848, 'loss/train': 1.5119004249572754} +11/06/2021 23:17:44 - INFO - __main__ - Step 14850: {'lr': 0.0004907587429942952, 'samples': 2851200, 'steps': 14849, 'loss/train': 2.091411590576172} +11/06/2021 23:17:45 - INFO - __main__ - Step 14851: {'lr': 0.0004907573134283872, 'samples': 2851392, 'steps': 14850, 'loss/train': 1.808640718460083} +11/06/2021 23:17:45 - INFO - __main__ - Step 14852: {'lr': 0.0004907558837539976, 'samples': 2851584, 'steps': 14851, 'loss/train': 1.7864621877670288} +11/06/2021 23:17:46 - INFO - __main__ - Step 14853: {'lr': 0.0004907544539711272, 'samples': 2851776, 'steps': 14852, 'loss/train': 1.476940631866455} +11/06/2021 23:17:46 - INFO - __main__ - Step 14854: {'lr': 0.0004907530240797765, 'samples': 2851968, 'steps': 14853, 'loss/train': 1.674166202545166} +11/06/2021 23:17:47 - INFO - __main__ - Step 14855: {'lr': 0.0004907515940799463, 'samples': 2852160, 'steps': 14854, 'loss/train': 1.497134804725647} +11/06/2021 23:17:48 - INFO - __main__ - Step 14856: {'lr': 0.000490750163971637, 'samples': 2852352, 'steps': 14855, 'loss/train': 1.8654690980911255} +11/06/2021 23:17:48 - INFO - __main__ - Step 14857: {'lr': 0.0004907487337548495, 'samples': 2852544, 'steps': 14856, 'loss/train': 1.693071722984314} +11/06/2021 23:17:49 - INFO - __main__ - Step 14858: {'lr': 0.0004907473034295843, 'samples': 2852736, 'steps': 14857, 'loss/train': 1.270855188369751} +11/06/2021 23:17:49 - INFO - __main__ - Step 14859: {'lr': 0.0004907458729958422, 'samples': 2852928, 'steps': 14858, 'loss/train': 1.4801957607269287} +11/06/2021 23:17:49 - INFO - __main__ - Step 14860: {'lr': 0.0004907444424536235, 'samples': 2853120, 'steps': 14859, 'loss/train': 1.5060356855392456} +11/06/2021 23:17:50 - INFO - __main__ - Step 14861: {'lr': 0.0004907430118029293, 'samples': 2853312, 'steps': 14860, 'loss/train': 1.8055636882781982} +11/06/2021 23:17:51 - INFO - __main__ - Step 14862: {'lr': 0.0004907415810437598, 'samples': 2853504, 'steps': 14861, 'loss/train': 1.6325714588165283} +11/06/2021 23:17:51 - INFO - __main__ - Step 14863: {'lr': 0.0004907401501761159, 'samples': 2853696, 'steps': 14862, 'loss/train': 1.5240354537963867} +11/06/2021 23:17:51 - INFO - __main__ - Step 14864: {'lr': 0.0004907387191999984, 'samples': 2853888, 'steps': 14863, 'loss/train': 1.4284332990646362} +11/06/2021 23:17:52 - INFO - __main__ - Step 14865: {'lr': 0.0004907372881154075, 'samples': 2854080, 'steps': 14864, 'loss/train': 1.6523523330688477} +11/06/2021 23:17:53 - INFO - __main__ - Step 14866: {'lr': 0.0004907358569223442, 'samples': 2854272, 'steps': 14865, 'loss/train': 1.5434261560440063} +11/06/2021 23:17:53 - INFO - __main__ - Step 14867: {'lr': 0.000490734425620809, 'samples': 2854464, 'steps': 14866, 'loss/train': 1.671189785003662} +11/06/2021 23:17:53 - INFO - __main__ - Step 14868: {'lr': 0.0004907329942108027, 'samples': 2854656, 'steps': 14867, 'loss/train': 1.6853291988372803} +11/06/2021 23:17:54 - INFO - __main__ - Step 14869: {'lr': 0.0004907315626923258, 'samples': 2854848, 'steps': 14868, 'loss/train': 1.1505197286605835} +11/06/2021 23:17:54 - INFO - __main__ - Step 14870: {'lr': 0.0004907301310653789, 'samples': 2855040, 'steps': 14869, 'loss/train': 1.6277196407318115} +11/06/2021 23:17:55 - INFO - __main__ - Step 14871: {'lr': 0.0004907286993299627, 'samples': 2855232, 'steps': 14870, 'loss/train': 2.135899305343628} +11/06/2021 23:17:56 - INFO - __main__ - Step 14872: {'lr': 0.0004907272674860779, 'samples': 2855424, 'steps': 14871, 'loss/train': 2.0826239585876465} +11/06/2021 23:17:56 - INFO - __main__ - Step 14873: {'lr': 0.0004907258355337251, 'samples': 2855616, 'steps': 14872, 'loss/train': 1.8687199354171753} +11/06/2021 23:17:56 - INFO - __main__ - Step 14874: {'lr': 0.0004907244034729049, 'samples': 2855808, 'steps': 14873, 'loss/train': 1.6615655422210693} +11/06/2021 23:17:57 - INFO - __main__ - Step 14875: {'lr': 0.0004907229713036181, 'samples': 2856000, 'steps': 14874, 'loss/train': 1.7533270120620728} +11/06/2021 23:17:57 - INFO - __main__ - Step 14876: {'lr': 0.0004907215390258652, 'samples': 2856192, 'steps': 14875, 'loss/train': 1.654037356376648} +11/06/2021 23:17:58 - INFO - __main__ - Step 14877: {'lr': 0.0004907201066396469, 'samples': 2856384, 'steps': 14876, 'loss/train': 1.8480337858200073} +11/06/2021 23:17:58 - INFO - __main__ - Step 14878: {'lr': 0.0004907186741449638, 'samples': 2856576, 'steps': 14877, 'loss/train': 1.6371917724609375} +11/06/2021 23:17:59 - INFO - __main__ - Step 14879: {'lr': 0.0004907172415418166, 'samples': 2856768, 'steps': 14878, 'loss/train': 1.5165156126022339} +11/06/2021 23:17:59 - INFO - __main__ - Step 14880: {'lr': 0.0004907158088302059, 'samples': 2856960, 'steps': 14879, 'loss/train': 1.6989234685897827} +11/06/2021 23:17:59 - INFO - __main__ - Step 14881: {'lr': 0.0004907143760101325, 'samples': 2857152, 'steps': 14880, 'loss/train': 1.368466854095459} +11/06/2021 23:18:01 - INFO - __main__ - Step 14882: {'lr': 0.0004907129430815968, 'samples': 2857344, 'steps': 14881, 'loss/train': 1.8604637384414673} +11/06/2021 23:18:01 - INFO - __main__ - Step 14883: {'lr': 0.0004907115100445996, 'samples': 2857536, 'steps': 14882, 'loss/train': 1.6678239107131958} +11/06/2021 23:18:01 - INFO - __main__ - Step 14884: {'lr': 0.0004907100768991415, 'samples': 2857728, 'steps': 14883, 'loss/train': 2.169818878173828} +11/06/2021 23:18:02 - INFO - __main__ - Step 14885: {'lr': 0.0004907086436452231, 'samples': 2857920, 'steps': 14884, 'loss/train': 1.5355026721954346} +11/06/2021 23:18:02 - INFO - __main__ - Step 14886: {'lr': 0.0004907072102828451, 'samples': 2858112, 'steps': 14885, 'loss/train': 1.5460067987442017} +11/06/2021 23:18:03 - INFO - __main__ - Step 14887: {'lr': 0.0004907057768120082, 'samples': 2858304, 'steps': 14886, 'loss/train': 1.5537009239196777} +11/06/2021 23:18:03 - INFO - __main__ - Step 14888: {'lr': 0.000490704343232713, 'samples': 2858496, 'steps': 14887, 'loss/train': 1.7863291501998901} +11/06/2021 23:18:04 - INFO - __main__ - Step 14889: {'lr': 0.0004907029095449602, 'samples': 2858688, 'steps': 14888, 'loss/train': 1.847086787223816} +11/06/2021 23:18:04 - INFO - __main__ - Step 14890: {'lr': 0.0004907014757487503, 'samples': 2858880, 'steps': 14889, 'loss/train': 1.9282914400100708} +11/06/2021 23:18:04 - INFO - __main__ - Step 14891: {'lr': 0.0004907000418440839, 'samples': 2859072, 'steps': 14890, 'loss/train': 1.711198091506958} +11/06/2021 23:18:05 - INFO - __main__ - Step 14892: {'lr': 0.000490698607830962, 'samples': 2859264, 'steps': 14891, 'loss/train': 1.5940576791763306} +11/06/2021 23:18:06 - INFO - __main__ - Step 14893: {'lr': 0.0004906971737093849, 'samples': 2859456, 'steps': 14892, 'loss/train': 1.9280325174331665} +11/06/2021 23:18:06 - INFO - __main__ - Step 14894: {'lr': 0.0004906957394793534, 'samples': 2859648, 'steps': 14893, 'loss/train': 1.427196979522705} +11/06/2021 23:18:06 - INFO - __main__ - Step 14895: {'lr': 0.0004906943051408682, 'samples': 2859840, 'steps': 14894, 'loss/train': 1.3355380296707153} +11/06/2021 23:18:07 - INFO - __main__ - Step 14896: {'lr': 0.0004906928706939296, 'samples': 2860032, 'steps': 14895, 'loss/train': 1.7179498672485352} +11/06/2021 23:18:08 - INFO - __main__ - Step 14897: {'lr': 0.0004906914361385387, 'samples': 2860224, 'steps': 14896, 'loss/train': 1.7625758647918701} +11/06/2021 23:18:08 - INFO - __main__ - Step 14898: {'lr': 0.0004906900014746959, 'samples': 2860416, 'steps': 14897, 'loss/train': 1.622707724571228} +11/06/2021 23:18:09 - INFO - __main__ - Step 14899: {'lr': 0.000490688566702402, 'samples': 2860608, 'steps': 14898, 'loss/train': 1.7065162658691406} +11/06/2021 23:18:09 - INFO - __main__ - Step 14900: {'lr': 0.0004906871318216575, 'samples': 2860800, 'steps': 14899, 'loss/train': 1.6930841207504272} +11/06/2021 23:18:09 - INFO - __main__ - Step 14901: {'lr': 0.000490685696832463, 'samples': 2860992, 'steps': 14900, 'loss/train': 1.9356876611709595} +11/06/2021 23:18:10 - INFO - __main__ - Step 14902: {'lr': 0.0004906842617348193, 'samples': 2861184, 'steps': 14901, 'loss/train': 1.8025461435317993} +11/06/2021 23:18:11 - INFO - __main__ - Step 14903: {'lr': 0.000490682826528727, 'samples': 2861376, 'steps': 14902, 'loss/train': 1.7793097496032715} +11/06/2021 23:18:11 - INFO - __main__ - Step 14904: {'lr': 0.0004906813912141868, 'samples': 2861568, 'steps': 14903, 'loss/train': 2.1294806003570557} +11/06/2021 23:18:11 - INFO - __main__ - Step 14905: {'lr': 0.0004906799557911992, 'samples': 2861760, 'steps': 14904, 'loss/train': 1.366396427154541} +11/06/2021 23:18:12 - INFO - __main__ - Step 14906: {'lr': 0.0004906785202597649, 'samples': 2861952, 'steps': 14905, 'loss/train': 1.2872095108032227} +11/06/2021 23:18:13 - INFO - __main__ - Step 14907: {'lr': 0.0004906770846198846, 'samples': 2862144, 'steps': 14906, 'loss/train': 1.8077151775360107} +11/06/2021 23:18:13 - INFO - __main__ - Step 14908: {'lr': 0.0004906756488715589, 'samples': 2862336, 'steps': 14907, 'loss/train': 1.617505669593811} +11/06/2021 23:18:14 - INFO - __main__ - Step 14909: {'lr': 0.0004906742130147884, 'samples': 2862528, 'steps': 14908, 'loss/train': 1.6927767992019653} +11/06/2021 23:18:14 - INFO - __main__ - Step 14910: {'lr': 0.0004906727770495739, 'samples': 2862720, 'steps': 14909, 'loss/train': 1.645467758178711} +11/06/2021 23:18:14 - INFO - __main__ - Step 14911: {'lr': 0.000490671340975916, 'samples': 2862912, 'steps': 14910, 'loss/train': 1.7554125785827637} +11/06/2021 23:18:15 - INFO - __main__ - Step 14912: {'lr': 0.0004906699047938153, 'samples': 2863104, 'steps': 14911, 'loss/train': 1.9322426319122314} +11/06/2021 23:18:16 - INFO - __main__ - Step 14913: {'lr': 0.0004906684685032724, 'samples': 2863296, 'steps': 14912, 'loss/train': 0.9366849064826965} +11/06/2021 23:18:16 - INFO - __main__ - Step 14914: {'lr': 0.0004906670321042881, 'samples': 2863488, 'steps': 14913, 'loss/train': 1.394436240196228} +11/06/2021 23:18:16 - INFO - __main__ - Step 14915: {'lr': 0.0004906655955968628, 'samples': 2863680, 'steps': 14914, 'loss/train': 1.2023478746414185} +11/06/2021 23:18:17 - INFO - __main__ - Step 14916: {'lr': 0.0004906641589809973, 'samples': 2863872, 'steps': 14915, 'loss/train': 2.0545525550842285} +11/06/2021 23:18:17 - INFO - __main__ - Step 14917: {'lr': 0.0004906627222566924, 'samples': 2864064, 'steps': 14916, 'loss/train': 1.4498852491378784} +11/06/2021 23:18:18 - INFO - __main__ - Step 14918: {'lr': 0.0004906612854239485, 'samples': 2864256, 'steps': 14917, 'loss/train': 1.5706671476364136} +11/06/2021 23:18:19 - INFO - __main__ - Step 14919: {'lr': 0.0004906598484827663, 'samples': 2864448, 'steps': 14918, 'loss/train': 1.427777647972107} +11/06/2021 23:18:19 - INFO - __main__ - Step 14920: {'lr': 0.0004906584114331465, 'samples': 2864640, 'steps': 14919, 'loss/train': 1.9566161632537842} +11/06/2021 23:18:19 - INFO - __main__ - Step 14921: {'lr': 0.0004906569742750899, 'samples': 2864832, 'steps': 14920, 'loss/train': 1.7183939218521118} +11/06/2021 23:18:20 - INFO - __main__ - Step 14922: {'lr': 0.0004906555370085968, 'samples': 2865024, 'steps': 14921, 'loss/train': 1.8103671073913574} +11/06/2021 23:18:21 - INFO - __main__ - Step 14923: {'lr': 0.000490654099633668, 'samples': 2865216, 'steps': 14922, 'loss/train': 1.5817921161651611} +11/06/2021 23:18:21 - INFO - __main__ - Step 14924: {'lr': 0.0004906526621503043, 'samples': 2865408, 'steps': 14923, 'loss/train': 1.145911455154419} +11/06/2021 23:18:21 - INFO - __main__ - Step 14925: {'lr': 0.0004906512245585062, 'samples': 2865600, 'steps': 14924, 'loss/train': 2.2841901779174805} +11/06/2021 23:18:22 - INFO - __main__ - Step 14926: {'lr': 0.0004906497868582743, 'samples': 2865792, 'steps': 14925, 'loss/train': 1.4507989883422852} +11/06/2021 23:18:22 - INFO - __main__ - Step 14927: {'lr': 0.0004906483490496093, 'samples': 2865984, 'steps': 14926, 'loss/train': 1.791601538658142} +11/06/2021 23:18:23 - INFO - __main__ - Step 14928: {'lr': 0.000490646911132512, 'samples': 2866176, 'steps': 14927, 'loss/train': 1.7833375930786133} +11/06/2021 23:18:23 - INFO - __main__ - Step 14929: {'lr': 0.0004906454731069828, 'samples': 2866368, 'steps': 14928, 'loss/train': 1.2282170057296753} +11/06/2021 23:18:24 - INFO - __main__ - Step 14930: {'lr': 0.0004906440349730226, 'samples': 2866560, 'steps': 14929, 'loss/train': 1.1155771017074585} +11/06/2021 23:18:24 - INFO - __main__ - Step 14931: {'lr': 0.0004906425967306317, 'samples': 2866752, 'steps': 14930, 'loss/train': 1.8701684474945068} +11/06/2021 23:18:24 - INFO - __main__ - Step 14932: {'lr': 0.0004906411583798112, 'samples': 2866944, 'steps': 14931, 'loss/train': 1.1279278993606567} +11/06/2021 23:18:26 - INFO - __main__ - Step 14933: {'lr': 0.0004906397199205614, 'samples': 2867136, 'steps': 14932, 'loss/train': 1.0893620252609253} +11/06/2021 23:18:26 - INFO - __main__ - Step 14934: {'lr': 0.000490638281352883, 'samples': 2867328, 'steps': 14933, 'loss/train': 1.8908346891403198} +11/06/2021 23:18:26 - INFO - __main__ - Step 14935: {'lr': 0.0004906368426767767, 'samples': 2867520, 'steps': 14934, 'loss/train': 0.6824740767478943} +11/06/2021 23:18:27 - INFO - __main__ - Step 14936: {'lr': 0.0004906354038922432, 'samples': 2867712, 'steps': 14935, 'loss/train': 1.8815536499023438} +11/06/2021 23:18:27 - INFO - __main__ - Step 14937: {'lr': 0.000490633964999283, 'samples': 2867904, 'steps': 14936, 'loss/train': 1.1689196825027466} +11/06/2021 23:18:28 - INFO - __main__ - Step 14938: {'lr': 0.000490632525997897, 'samples': 2868096, 'steps': 14937, 'loss/train': 1.6703389883041382} +11/06/2021 23:18:28 - INFO - __main__ - Step 14939: {'lr': 0.0004906310868880856, 'samples': 2868288, 'steps': 14938, 'loss/train': 1.6411389112472534} +11/06/2021 23:18:29 - INFO - __main__ - Step 14940: {'lr': 0.0004906296476698496, 'samples': 2868480, 'steps': 14939, 'loss/train': 1.2749041318893433} +11/06/2021 23:18:29 - INFO - __main__ - Step 14941: {'lr': 0.0004906282083431897, 'samples': 2868672, 'steps': 14940, 'loss/train': 1.5104907751083374} +11/06/2021 23:18:29 - INFO - __main__ - Step 14942: {'lr': 0.0004906267689081063, 'samples': 2868864, 'steps': 14941, 'loss/train': 1.9198617935180664} +11/06/2021 23:18:30 - INFO - __main__ - Step 14943: {'lr': 0.0004906253293646002, 'samples': 2869056, 'steps': 14942, 'loss/train': 1.7235310077667236} +11/06/2021 23:18:31 - INFO - __main__ - Step 14944: {'lr': 0.0004906238897126721, 'samples': 2869248, 'steps': 14943, 'loss/train': 1.3015567064285278} +11/06/2021 23:18:31 - INFO - __main__ - Step 14945: {'lr': 0.0004906224499523225, 'samples': 2869440, 'steps': 14944, 'loss/train': 1.208406686782837} +11/06/2021 23:18:31 - INFO - __main__ - Step 14946: {'lr': 0.0004906210100835522, 'samples': 2869632, 'steps': 14945, 'loss/train': 1.7185678482055664} +11/06/2021 23:18:32 - INFO - __main__ - Step 14947: {'lr': 0.0004906195701063617, 'samples': 2869824, 'steps': 14946, 'loss/train': 1.6271605491638184} +11/06/2021 23:18:33 - INFO - __main__ - Step 14948: {'lr': 0.0004906181300207518, 'samples': 2870016, 'steps': 14947, 'loss/train': 1.1316771507263184} +11/06/2021 23:18:33 - INFO - __main__ - Step 14949: {'lr': 0.0004906166898267231, 'samples': 2870208, 'steps': 14948, 'loss/train': 1.8571279048919678} +11/06/2021 23:18:34 - INFO - __main__ - Step 14950: {'lr': 0.0004906152495242763, 'samples': 2870400, 'steps': 14949, 'loss/train': 1.3722232580184937} +11/06/2021 23:18:34 - INFO - __main__ - Step 14951: {'lr': 0.0004906138091134118, 'samples': 2870592, 'steps': 14950, 'loss/train': 1.7835454940795898} +11/06/2021 23:18:34 - INFO - __main__ - Step 14952: {'lr': 0.0004906123685941306, 'samples': 2870784, 'steps': 14951, 'loss/train': 1.6602545976638794} +11/06/2021 23:18:35 - INFO - __main__ - Step 14953: {'lr': 0.000490610927966433, 'samples': 2870976, 'steps': 14952, 'loss/train': 1.557942509651184} +11/06/2021 23:18:36 - INFO - __main__ - Step 14954: {'lr': 0.00049060948723032, 'samples': 2871168, 'steps': 14953, 'loss/train': 1.7364459037780762} +11/06/2021 23:18:36 - INFO - __main__ - Step 14955: {'lr': 0.000490608046385792, 'samples': 2871360, 'steps': 14954, 'loss/train': 2.2763864994049072} +11/06/2021 23:18:36 - INFO - __main__ - Step 14956: {'lr': 0.0004906066054328498, 'samples': 2871552, 'steps': 14955, 'loss/train': 1.585302472114563} +11/06/2021 23:18:37 - INFO - __main__ - Step 14957: {'lr': 0.0004906051643714939, 'samples': 2871744, 'steps': 14956, 'loss/train': 1.91652250289917} +11/06/2021 23:18:38 - INFO - __main__ - Step 14958: {'lr': 0.000490603723201725, 'samples': 2871936, 'steps': 14957, 'loss/train': 3.7174441814422607} +11/06/2021 23:18:38 - INFO - __main__ - Step 14959: {'lr': 0.0004906022819235438, 'samples': 2872128, 'steps': 14958, 'loss/train': 1.5262293815612793} +11/06/2021 23:18:38 - INFO - __main__ - Step 14960: {'lr': 0.000490600840536951, 'samples': 2872320, 'steps': 14959, 'loss/train': 1.9472852945327759} +11/06/2021 23:18:39 - INFO - __main__ - Step 14961: {'lr': 0.0004905993990419471, 'samples': 2872512, 'steps': 14960, 'loss/train': 1.6929538249969482} +11/06/2021 23:18:39 - INFO - __main__ - Step 14962: {'lr': 0.0004905979574385328, 'samples': 2872704, 'steps': 14961, 'loss/train': 1.4080133438110352} +11/06/2021 23:18:39 - INFO - __main__ - Step 14963: {'lr': 0.0004905965157267088, 'samples': 2872896, 'steps': 14962, 'loss/train': 1.8805720806121826} +11/06/2021 23:18:41 - INFO - __main__ - Step 14964: {'lr': 0.0004905950739064758, 'samples': 2873088, 'steps': 14963, 'loss/train': 1.8650027513504028} +11/06/2021 23:18:41 - INFO - __main__ - Step 14965: {'lr': 0.0004905936319778343, 'samples': 2873280, 'steps': 14964, 'loss/train': 1.3455829620361328} +11/06/2021 23:18:41 - INFO - __main__ - Step 14966: {'lr': 0.000490592189940785, 'samples': 2873472, 'steps': 14965, 'loss/train': 1.7468905448913574} +11/06/2021 23:18:42 - INFO - __main__ - Step 14967: {'lr': 0.0004905907477953286, 'samples': 2873664, 'steps': 14966, 'loss/train': 1.8428308963775635} +11/06/2021 23:18:42 - INFO - __main__ - Step 14968: {'lr': 0.0004905893055414658, 'samples': 2873856, 'steps': 14967, 'loss/train': 1.5465810298919678} +11/06/2021 23:18:43 - INFO - __main__ - Step 14969: {'lr': 0.0004905878631791971, 'samples': 2874048, 'steps': 14968, 'loss/train': 1.9906973838806152} +11/06/2021 23:18:43 - INFO - __main__ - Step 14970: {'lr': 0.0004905864207085232, 'samples': 2874240, 'steps': 14969, 'loss/train': 1.7254399061203003} +11/06/2021 23:18:44 - INFO - __main__ - Step 14971: {'lr': 0.0004905849781294448, 'samples': 2874432, 'steps': 14970, 'loss/train': 1.8917148113250732} +11/06/2021 23:18:44 - INFO - __main__ - Step 14972: {'lr': 0.0004905835354419625, 'samples': 2874624, 'steps': 14971, 'loss/train': 1.7392559051513672} +11/06/2021 23:18:44 - INFO - __main__ - Step 14973: {'lr': 0.0004905820926460769, 'samples': 2874816, 'steps': 14972, 'loss/train': 1.6358309984207153} +11/06/2021 23:18:45 - INFO - __main__ - Step 14974: {'lr': 0.0004905806497417888, 'samples': 2875008, 'steps': 14973, 'loss/train': 1.6739000082015991} +11/06/2021 23:18:46 - INFO - __main__ - Step 14975: {'lr': 0.0004905792067290988, 'samples': 2875200, 'steps': 14974, 'loss/train': 1.421985387802124} +11/06/2021 23:18:46 - INFO - __main__ - Step 14976: {'lr': 0.0004905777636080075, 'samples': 2875392, 'steps': 14975, 'loss/train': 1.8452321290969849} +11/06/2021 23:18:47 - INFO - __main__ - Step 14977: {'lr': 0.0004905763203785157, 'samples': 2875584, 'steps': 14976, 'loss/train': 1.7335155010223389} +11/06/2021 23:18:47 - INFO - __main__ - Step 14978: {'lr': 0.0004905748770406237, 'samples': 2875776, 'steps': 14977, 'loss/train': 1.7326487302780151} +11/06/2021 23:18:47 - INFO - __main__ - Step 14979: {'lr': 0.0004905734335943325, 'samples': 2875968, 'steps': 14978, 'loss/train': 1.5935941934585571} +11/06/2021 23:18:48 - INFO - __main__ - Step 14980: {'lr': 0.0004905719900396426, 'samples': 2876160, 'steps': 14979, 'loss/train': 1.410271406173706} +11/06/2021 23:18:49 - INFO - __main__ - Step 14981: {'lr': 0.0004905705463765546, 'samples': 2876352, 'steps': 14980, 'loss/train': 1.5823677778244019} +11/06/2021 23:18:49 - INFO - __main__ - Step 14982: {'lr': 0.0004905691026050692, 'samples': 2876544, 'steps': 14981, 'loss/train': 1.2565804719924927} +11/06/2021 23:18:49 - INFO - __main__ - Step 14983: {'lr': 0.0004905676587251873, 'samples': 2876736, 'steps': 14982, 'loss/train': 1.1940447092056274} +11/06/2021 23:18:50 - INFO - __main__ - Step 14984: {'lr': 0.0004905662147369091, 'samples': 2876928, 'steps': 14983, 'loss/train': 2.0281472206115723} +11/06/2021 23:18:50 - INFO - __main__ - Step 14985: {'lr': 0.0004905647706402356, 'samples': 2877120, 'steps': 14984, 'loss/train': 1.4245983362197876} +11/06/2021 23:18:51 - INFO - __main__ - Step 14986: {'lr': 0.0004905633264351673, 'samples': 2877312, 'steps': 14985, 'loss/train': 1.687376856803894} +11/06/2021 23:18:51 - INFO - __main__ - Step 14987: {'lr': 0.0004905618821217048, 'samples': 2877504, 'steps': 14986, 'loss/train': 1.4128832817077637} +11/06/2021 23:18:52 - INFO - __main__ - Step 14988: {'lr': 0.0004905604376998489, 'samples': 2877696, 'steps': 14987, 'loss/train': 1.4120585918426514} +11/06/2021 23:18:52 - INFO - __main__ - Step 14989: {'lr': 0.0004905589931696002, 'samples': 2877888, 'steps': 14988, 'loss/train': 1.6565570831298828} +11/06/2021 23:18:53 - INFO - __main__ - Step 14990: {'lr': 0.0004905575485309593, 'samples': 2878080, 'steps': 14989, 'loss/train': 1.8112573623657227} +11/06/2021 23:18:54 - INFO - __main__ - Step 14991: {'lr': 0.0004905561037839269, 'samples': 2878272, 'steps': 14990, 'loss/train': 1.1115037202835083} +11/06/2021 23:18:54 - INFO - __main__ - Step 14992: {'lr': 0.0004905546589285036, 'samples': 2878464, 'steps': 14991, 'loss/train': 1.6998533010482788} +11/06/2021 23:18:54 - INFO - __main__ - Step 14993: {'lr': 0.0004905532139646901, 'samples': 2878656, 'steps': 14992, 'loss/train': 0.203787699341774} +11/06/2021 23:18:55 - INFO - __main__ - Step 14994: {'lr': 0.000490551768892487, 'samples': 2878848, 'steps': 14993, 'loss/train': 2.0352189540863037} +11/06/2021 23:18:55 - INFO - __main__ - Step 14995: {'lr': 0.000490550323711895, 'samples': 2879040, 'steps': 14994, 'loss/train': 1.996849536895752} +11/06/2021 23:18:56 - INFO - __main__ - Step 14996: {'lr': 0.0004905488784229147, 'samples': 2879232, 'steps': 14995, 'loss/train': 1.7386120557785034} +11/06/2021 23:18:57 - INFO - __main__ - Step 14997: {'lr': 0.000490547433025547, 'samples': 2879424, 'steps': 14996, 'loss/train': 1.7791500091552734} +11/06/2021 23:18:57 - INFO - __main__ - Step 14998: {'lr': 0.0004905459875197921, 'samples': 2879616, 'steps': 14997, 'loss/train': 1.2726280689239502} +11/06/2021 23:18:57 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 1.6460684537887573} +11/06/2021 23:18:58 - INFO - __main__ - Step 15000: {'lr': 0.0004905430961831242, 'samples': 2880000, 'steps': 14999, 'loss/train': 0.5816349983215332} +11/06/2021 23:18:58 - INFO - __main__ - Evaluating and saving model checkpoint +11/06/2021 23:22:11 - INFO - __main__ - Step 15000: {'loss/eval': 1.610079050064087, 'perplexity': 5.003206729888916}